db-performance-watchlist

安装量: 35
排名: #19670

安装

npx skills add https://github.com/patricio0312rev/skills --skill db-performance-watchlist
DB Performance Watchlist
Monitor database performance and prevent regressions.
Key Performance Metrics
// performance-metrics.ts
export
interface
DBMetrics
{
// Query Performance
slowQueries
:
{
threshold
:
number
;
// ms
count
:
number
;
queries
:
SlowQuery
[
]
;
}
;
// Connection Pool
connections
:
{
active
:
number
;
idle
:
number
;
total
:
number
;
maxConnections
:
number
;
utilizationPercent
:
number
;
}
;
// Resource Usage
resources
:
{
cpuPercent
:
number
;
memoryPercent
:
number
;
diskUsagePercent
:
number
;
iops
:
number
;
}
;
// Query Statistics
queryStats
:
{
selectsPerSecond
:
number
;
insertsPerSecond
:
number
;
updatesPerSecond
:
number
;
deletesPerSecond
:
number
;
}
;
// Cache Performance
cache
:
{
hitRate
:
number
;
// %
size
:
number
;
// MB
evictions
:
number
;
}
;
// Index Usage
indexes
:
{
unusedIndexes
:
string
[
]
;
missingIndexes
:
string
[
]
;
}
;
}
interface
SlowQuery
{
query
:
string
;
duration
:
number
;
calls
:
number
;
avgDuration
:
number
;
table
:
string
;
}
Slow Query Detection
// scripts/detect-slow-queries.ts
async
function
detectSlowQueries
(
thresholdMs
:
number
=
100
)
{
// Enable slow query logging (PostgreSQL)
await
prisma
.
$executeRaw
`
ALTER DATABASE mydb
SET log_min_duration_statement =
${
thresholdMs
}
;
`
;
// Query pg_stat_statements for slow queries
const
slowQueries
=
await
prisma
.
$queryRaw
<
SlowQuery
[
]
>
`
SELECT
query,
calls,
total_exec_time / 1000 as total_time_ms,
mean_exec_time / 1000 as avg_time_ms,
max_exec_time / 1000 as max_time_ms,
(total_exec_time / sum(total_exec_time) OVER()) * 100 as percent_of_total
FROM pg_stat_statements
WHERE mean_exec_time >
${
thresholdMs
}
ORDER BY mean_exec_time DESC
LIMIT 20
`
;
console
.
log
(
"🐌 Slow Queries Detected:\n"
)
;
slowQueries
.
forEach
(
(
q
,
i
)
=>
{
console
.
log
(
`
${
i
+
1
}
.
${
q
.
query
.
substring
(
0
,
80
)
}
...
`
)
;
console
.
log
(
`
Calls:
${
q
.
calls
}
`
)
;
console
.
log
(
`
Avg:
${
q
.
avg_time_ms
.
toFixed
(
2
)
}
ms
`
)
;
console
.
log
(
`
Max:
${
q
.
max_time_ms
.
toFixed
(
2
)
}
ms
`
)
;
console
.
log
(
`
% of total time:
${
q
.
percent_of_total
.
toFixed
(
1
)
}
%\n
`
)
;
}
)
;
return
slowQueries
;
}
Connection Pool Monitoring
async
function
monitorConnectionPool
(
)
{
const
stats
=
await
prisma
.
$queryRaw
<
any
[
]
>
`
SELECT
sum(numbackends) as total_connections,
sum(CASE WHEN state = 'active' THEN 1 ELSE 0 END) as active,
sum(CASE WHEN state = 'idle' THEN 1 ELSE 0 END) as idle,
max_connections
FROM pg_stat_database
CROSS JOIN (SELECT setting::int as max_connections FROM pg_settings WHERE name = 'max_connections')
WHERE datname = current_database()
GROUP BY max_connections
`
;
const
{
total_connections
,
active
,
idle
,
max_connections
}
=
stats
[
0
]
;
const
utilization
=
(
total_connections
/
max_connections
)
*
100
;
console
.
log
(
"🔌 Connection Pool Status:"
)
;
console
.
log
(
`
Total:
${
total_connections
}
/
${
max_connections
}
(
${
utilization
.
toFixed
(
1
)
}
%)
`
)
;
console
.
log
(
`
Active:
${
active
}
`
)
;
console
.
log
(
`
Idle:
${
idle
}
`
)
;
// Alert if > 80% utilization
if
(
utilization
>
80
)
{
console
.
warn
(
"⚠️ Connection pool >80% utilized!"
)
;
await
sendAlert
(
{
title
:
"High connection pool usage"
,
message
:
`
${
utilization
.
toFixed
(
1
)
}
% of connections in use
`
,
}
)
;
}
}
Resource Monitoring
async
function
monitorResources
(
)
{
// CPU Usage
const
cpuStats
=
await
prisma
.
$queryRaw
<
any
[
]
>
`
SELECT
(sum(total_exec_time) / (extract(epoch from (now() - stats_reset)) * 1000 * 100)) as cpu_percent
FROM pg_stat_statements, pg_stat_database
WHERE datname = current_database()
`
;
// Memory Usage
const
memStats
=
await
prisma
.
$queryRaw
<
any
[
]
>
`
SELECT
pg_size_pretty(pg_database_size(current_database())) as db_size,
pg_size_pretty(sum(pg_relation_size(schemaname||'.'||tablename))) as tables_size
FROM pg_tables
WHERE schemaname = 'public'
`
;
// Cache Hit Rate
const
cacheStats
=
await
prisma
.
$queryRaw
<
any
[
]
>
`
SELECT
sum(heap_blks_hit) / (sum(heap_blks_hit) + sum(heap_blks_read)) * 100 as cache_hit_rate
FROM pg_statio_user_tables
`
;
console
.
log
(
"📊 Resource Usage:"
)
;
console
.
log
(
`
CPU:
${
cpuStats
[
0
]
.
cpu_percent
.
toFixed
(
1
)
}
%
`
)
;
console
.
log
(
`
Database Size:
${
memStats
[
0
]
.
db_size
}
`
)
;
console
.
log
(
`
Cache Hit Rate:
${
cacheStats
[
0
]
.
cache_hit_rate
.
toFixed
(
1
)
}
%
`
)
;
// Alert if cache hit rate < 90%
if
(
cacheStats
[
0
]
.
cache_hit_rate
<
90
)
{
console
.
warn
(
"⚠️ Cache hit rate below 90%!"
)
;
await
sendAlert
(
{
title
:
"Low cache hit rate"
,
message
:
`
Cache hit rate:
${
cacheStats
[
0
]
.
cache_hit_rate
.
toFixed
(
1
)
}
%
`
,
}
)
;
}
}
Index Usage Analysis
async
function
analyzeIndexUsage
(
)
{
// Find unused indexes
const
unusedIndexes
=
await
prisma
.
$queryRaw
<
any
[
]
>
`
SELECT
schemaname,
tablename,
indexname,
idx_scan
FROM pg_stat_user_indexes
WHERE idx_scan = 0
AND indexname NOT LIKE '%_pkey'
ORDER BY pg_relation_size(indexrelid) DESC
`
;
console
.
log
(
"🗂️ Unused Indexes:\n"
)
;
unusedIndexes
.
forEach
(
(
idx
)
=>
{
console
.
log
(
`
${
idx
.
tablename
}
.
${
idx
.
indexname
}
(0 scans)
`
)
;
}
)
;
// Find missing indexes (sequential scans on large tables)
const
missingIndexes
=
await
prisma
.
$queryRaw
<
any
[
]
>
`
SELECT
schemaname,
tablename,
seq_scan,
seq_tup_read,
idx_scan,
n_live_tup
FROM pg_stat_user_tables
WHERE seq_scan > 1000
AND n_live_tup > 10000
ORDER BY seq_scan * n_live_tup DESC
LIMIT 10
`
;
console
.
log
(
"\n📉 Tables with High Sequential Scans:\n"
)
;
missingIndexes
.
forEach
(
(
table
)
=>
{
console
.
log
(
`
${
table
.
tablename
}
:
`
)
;
console
.
log
(
`
Sequential scans:
${
table
.
seq_scan
}
`
)
;
console
.
log
(
`
Rows:
${
table
.
n_live_tup
}
`
)
;
console
.
log
(
`
Index scans:
${
table
.
idx_scan
}
`
)
;
}
)
;
}
Alert Thresholds
const
ALERT_THRESHOLDS
=
{
slowQuery
:
{
avgDuration
:
500
,
// ms
maxDuration
:
2000
,
// ms
callsPerMinute
:
100
,
}
,
connections
:
{
utilizationWarning
:
70
,
// %
utilizationCritical
:
85
,
// %
}
,
resources
:
{
cpuWarning
:
70
,
// %
cpuCritical
:
85
,
// %
memoryWarning
:
80
,
// %
memoryCritical
:
90
,
// %
diskWarning
:
75
,
// %
diskCritical
:
85
,
// %
}
,
cache
:
{
hitRateWarning
:
90
,
// %
hitRateCritical
:
80
,
// %
}
,
queryRate
:
{
maxSelectsPerSecond
:
10000
,
maxWritesPerSecond
:
1000
,
}
,
}
;
async
function
checkThresholds
(
)
{
const
metrics
=
await
gatherMetrics
(
)
;
// Check slow queries
if
(
metrics
.
slowQueries
.
count
>
10
)
{
await
sendAlert
(
{
level
:
"warning"
,
title
:
"Slow queries detected"
,
message
:
`
${
metrics
.
slowQueries
.
count
}
queries exceeding
${
ALERT_THRESHOLDS
.
slowQuery
.
avgDuration
}
ms
`
,
}
)
;
}
// Check connection pool
if
(
metrics
.
connections
.
utilizationPercent
>
ALERT_THRESHOLDS
.
connections
.
utilizationCritical
)
{
await
sendAlert
(
{
level
:
"critical"
,
title
:
"Connection pool critical"
,
message
:
`
${
metrics
.
connections
.
utilizationPercent
.
toFixed
(
1
)
}
% utilization
`
,
}
)
;
}
// Check cache hit rate
if
(
metrics
.
cache
.
hitRate
<
ALERT_THRESHOLDS
.
cache
.
hitRateCritical
)
{
await
sendAlert
(
{
level
:
"critical"
,
title
:
"Cache hit rate critical"
,
message
:
`
${
metrics
.
cache
.
hitRate
.
toFixed
(
1
)
}
% hit rate
`
,
}
)
;
}
}
Monitoring Dashboard
// Generate monitoring report
async
function
generatePerformanceReport
(
)
{
console
.
log
(
"📊 Database Performance Report\n"
)
;
console
.
log
(
"="
.
repeat
(
50
)
+
"\n"
)
;
// Slow queries
const
slowQueries
=
await
detectSlowQueries
(
100
)
;
console
.
log
(
`
Slow Queries (>100ms):
${
slowQueries
.
length
}
\n
`
)
;
// Connection pool
await
monitorConnectionPool
(
)
;
console
.
log
(
)
;
// Resources
await
monitorResources
(
)
;
console
.
log
(
)
;
// Index usage
await
analyzeIndexUsage
(
)
;
console
.
log
(
)
;
// Query rates
const
queryStats
=
await
prisma
.
$queryRaw
<
any
[
]
>
`
SELECT
sum(xact_commit + xact_rollback) as transactions,
sum(tup_returned) as rows_read,
sum(tup_inserted) as rows_inserted,
sum(tup_updated) as rows_updated,
sum(tup_deleted) as rows_deleted
FROM pg_stat_database
WHERE datname = current_database()
`
;
console
.
log
(
"📈 Query Statistics:"
)
;
console
.
log
(
`
Transactions:
${
queryStats
[
0
]
.
transactions
}
`
)
;
console
.
log
(
`
Rows read:
${
queryStats
[
0
]
.
rows_read
}
`
)
;
console
.
log
(
`
Rows inserted:
${
queryStats
[
0
]
.
rows_inserted
}
`
)
;
console
.
log
(
`
Rows updated:
${
queryStats
[
0
]
.
rows_updated
}
`
)
;
console
.
log
(
`
Rows deleted:
${
queryStats
[
0
]
.
rows_deleted
}
`
)
;
}
Automated Monitoring Script
// scripts/monitor-db.ts
import
cron
from
"node-cron"
;
// Run every 5 minutes
cron
.
schedule
(
"/5 * * * "
,
async
(
)
=>
{
await
checkThresholds
(
)
;
}
)
;
// Generate report every hour
cron
.
schedule
(
"0 * * * *"
,
async
(
)
=>
{
await
generatePerformanceReport
(
)
;
}
)
;
// Analyze indexes weekly
cron
.
schedule
(
"0 0 * * 0"
,
async
(
)
=>
{
await
analyzeIndexUsage
(
)
;
}
)
;
Grafana Dashboard Queries
-- Query latency over time
SELECT
bucket
,
AVG
(
mean_exec_time
)
as
avg_latency
,
MAX
(
max_exec_time
)
as
max_latency
,
SUM
(
calls
)
as
total_calls
FROM
pg_stat_statements
WHERE
query
NOT
LIKE
'%pg_stat_statements%'
GROUP
BY
time_bucket
(
'5 minutes'
,
queryid
)
ORDER
BY
bucket
;
-- Connection count over time
SELECT
now
(
)
as
time
,
count
(
*
)
as
total
,
count
(
*
)
FILTER
(
WHERE
state
=
'active'
)
as
active
,
count
(
*
)
FILTER
(
WHERE
state
=
'idle'
)
as
idle
FROM
pg_stat_activity
;
-- Cache hit rate
SELECT
sum
(
heap_blks_hit
)
/
(
sum
(
heap_blks_hit
)
+
sum
(
heap_blks_read
)
)
*
100
as
cache_hit_rate
FROM
pg_statio_user_tables
;
Best Practices
Monitor continuously
Don't wait for problems
Set appropriate thresholds
Based on your SLAs
Alert on trends
Not just absolute values
Review regularly
Weekly performance reviews
Automate everything
No manual checks
Document baselines
Know what's normal
Test alerts
Ensure they work Output Checklist Slow query detection configured Connection pool monitoring Resource usage tracking Cache hit rate monitoring Index usage analysis Alert thresholds defined Monitoring dashboard setup Automated checks scheduled Grafana/alerting integration Performance baseline documented
返回排行榜