-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathpg-prechecks.sh
498 lines (428 loc) · 19.8 KB
/
pg-prechecks.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
#!/bin/bash
# PostgreSQL Pre-Check Script
# This script collects information about a PostgreSQL instance and generates a summary report.
set -e
# Default values
PGHOST="your-rds-endpoint.region.rds.amazonaws.com"
PGPORT="5432"
PGUSER="your_rds_master_username"
PGDATABASE="postgres"
OUTPUT_DIR="pg_precheck_$(date +%Y%m%d_%H%M%S)"
# Function to execute PostgreSQL queries
run_query() {
psql -h "$PGHOST" -p "$PGPORT" -U "$PGUSER" -d "$PGDATABASE" -t -c "$1"
}
# Function to collect PostgreSQL information
collect_pg_info() {
echo "Collecting PostgreSQL information..."
mkdir -p "$OUTPUT_DIR"
# Check for logical replication support
run_query "SELECT CASE WHEN setting = 'logical' THEN 'Supported' ELSE 'Not supported' END AS logical_replication_support FROM pg_settings WHERE name = 'wal_level';" > "$OUTPUT_DIR/logical_replication.txt"
# Check for number of replicas
run_query "SELECT count(*) FROM pg_stat_replication;" > "$OUTPUT_DIR/replica_count.txt"
# Version information
run_query "SELECT version();" > "$OUTPUT_DIR/version.txt"
# List of databases
run_query "SELECT datname FROM pg_database WHERE datistemplate = false ORDER BY datname;" > "$OUTPUT_DIR/databases.txt"
# Database sizes
run_query "SELECT datname, pg_size_pretty(pg_database_size(datname)) FROM pg_database ORDER BY pg_database_size(datname) DESC;" > "$OUTPUT_DIR/database_sizes.txt"
# Table and index sizes (top 20) with headers
{
echo "Total Number of Indexes: $(run_query "SELECT count(*) FROM pg_indexes;")"
echo "Total Number of Tables: $(run_query "SELECT count(*) FROM pg_tables;")"
echo ""
echo "Table Name | Total Size | Table Size | Index Size"
echo "-----------|------------|------------|------------"
run_query "SELECT schemaname || '.' || tablename AS table_name,
pg_size_pretty(pg_total_relation_size(schemaname || '.' || tablename)) AS total_size,
pg_size_pretty(pg_table_size(schemaname || '.' || tablename)) AS table_size,
pg_size_pretty(pg_indexes_size(schemaname || '.' || tablename)) AS index_size
FROM pg_tables
ORDER BY pg_total_relation_size(schemaname || '.' || tablename) DESC;"
} > "$OUTPUT_DIR/table_index_sizes.txt"
# Settings
run_query "SELECT name, setting, unit, context FROM pg_settings ORDER BY name;" > "$OUTPUT_DIR/settings.txt"
# Extensions
run_query "SELECT * FROM pg_extension;" > "$OUTPUT_DIR/extensions.txt"
# Activity
run_query "SELECT * FROM pg_stat_activity;" > "$OUTPUT_DIR/activity.txt"
# Indexes (with headers and count)
{
echo "Total Number of Indexes: $(run_query "SELECT count(*) FROM pg_indexes;")"
echo ""
echo "Database | Schema | Table | Index Name | Index Size | Index Definition"
echo "----------|--------|--------|------------|------------|------------------"
run_query "SELECT
current_database() as database,
schemaname,
tablename,
indexname,
pg_size_pretty(pg_relation_size(schemaname || '.' || indexname::text)) as index_size,
indexdef
FROM pg_indexes
ORDER BY pg_relation_size(schemaname || '.' || indexname::text) DESC;"
} > "$OUTPUT_DIR/indexes.txt"
# Roles
run_query "SELECT * FROM pg_roles;" > "$OUTPUT_DIR/roles.txt"
# Long-Running Queries
echo "----------------------------------" > "$OUTPUT_DIR/long_running_queries.txt"
echo " Long-Running Queries" >> "$OUTPUT_DIR/long_running_queries.txt"
echo "----------------------------------" >> "$OUTPUT_DIR/long_running_queries.txt"
run_query "SELECT pid,
now() - pg_stat_activity.query_start AS duration,
query
FROM pg_stat_activity
WHERE state != 'idle'
AND now() - pg_stat_activity.query_start > interval '5 minutes'
ORDER BY duration DESC;" >> "$OUTPUT_DIR/long_running_queries.txt"
# Locks Information
echo "----------------------------------" > "$OUTPUT_DIR/locks_information.txt"
echo " Locks Information" >> "$OUTPUT_DIR/locks_information.txt"
echo "----------------------------------" >> "$OUTPUT_DIR/locks_information.txt"
run_query "SELECT l.pid,
locktype,
mode,
granted,
relation::regclass AS table_name,
a.query
FROM pg_locks l
JOIN pg_stat_activity a ON l.pid = a.pid
WHERE relation IS NOT NULL
ORDER BY relation, locktype, mode;" >> "$OUTPUT_DIR/locks_information.txt"
# Total number of active locks
echo "----------------------------------" > "$OUTPUT_DIR/active_locks.txt"
echo " Total Active Locks" >> "$OUTPUT_DIR/active_locks.txt"
echo "----------------------------------" >> "$OUTPUT_DIR/active_locks.txt"
run_query "SELECT count(*) AS active_locks FROM pg_locks WHERE granted = true;" >> "$OUTPUT_DIR/active_locks.txt"
# Max locks per transaction
echo "----------------------------------" > "$OUTPUT_DIR/max_locks_per_transaction.txt"
echo " Max Locks Per Transaction" >> "$OUTPUT_DIR/max_locks_per_transaction.txt"
echo "----------------------------------" >> "$OUTPUT_DIR/max_locks_per_transaction.txt"
run_query "SELECT name, setting, unit FROM pg_settings WHERE name = 'max_locks_per_transaction';" >> "$OUTPUT_DIR/max_locks_per_transaction.txt"
# Check for partitions
echo "----------------------------------" > "$OUTPUT_DIR/partitions.txt"
echo " Partitioned Tables" >> "$OUTPUT_DIR/partitions.txt"
echo "----------------------------------" >> "$OUTPUT_DIR/partitions.txt"
run_query "SELECT parent.relname AS parent_table,
child.relname AS partition_name,
pg_get_expr(child.relpartbound, child.oid) AS partition_expression
FROM pg_inherits
JOIN pg_class parent ON pg_inherits.inhparent = parent.oid
JOIN pg_class child ON pg_inherits.inhrelid = child.oid
JOIN pg_namespace nmsp_parent ON nmsp_parent.oid = parent.relnamespace
JOIN pg_namespace nmsp_child ON nmsp_child.oid = child.relnamespace
WHERE parent.relkind = 'p'
ORDER BY parent.relname, child.relname;" >> "$OUTPUT_DIR/partitions.txt"
# Check for auto-generated columns
echo "----------------------------------" > "$OUTPUT_DIR/auto_generated_columns.txt"
echo " Auto-Generated Columns" >> "$OUTPUT_DIR/auto_generated_columns.txt"
echo "----------------------------------" >> "$OUTPUT_DIR/auto_generated_columns.txt"
run_query "SELECT table_schema, table_name, column_name, data_type, generation_expression
FROM information_schema.columns
WHERE is_generated = 'ALWAYS'
ORDER BY table_schema, table_name, column_name;" >> "$OUTPUT_DIR/auto_generated_columns.txt"
# Check for event triggers
echo "----------------------------------" > "$OUTPUT_DIR/event_triggers.txt"
echo " Event Triggers" >> "$OUTPUT_DIR/event_triggers.txt"
echo "----------------------------------" >> "$OUTPUT_DIR/event_triggers.txt"
run_query "SELECT evtname AS trigger_name,
evtevent AS trigger_event,
evtowner::regrole AS trigger_owner,
evtfoid::regproc AS trigger_function,
evtenabled AS trigger_enabled
FROM pg_event_trigger
ORDER BY evtname;" >> "$OUTPUT_DIR/event_triggers.txt"
# User-defined functions
{
echo "Total Number of User-Defined Functions: $(run_query "SELECT count(*) FROM pg_proc p JOIN pg_namespace n ON p.pronamespace = n.oid WHERE n.nspname NOT IN ('pg_catalog', 'information_schema');")"
echo ""
echo "Database | Schema | Function Name | Return Type | Language | Arguments | Volatility | Parallel | Security | Cost | Rows | Owner | Description"
echo "----------|---------|--------------|-------------|----------|-----------|------------|----------|----------|------|------|--------|-------------"
run_query "SELECT
current_database() as database,
n.nspname as schema,
p.proname as function_name,
pg_get_function_result(p.oid) as return_type,
l.lanname as language,
pg_get_function_arguments(p.oid) as arguments,
CASE p.provolatile
WHEN 'i' THEN 'IMMUTABLE'
WHEN 's' THEN 'STABLE'
WHEN 'v' THEN 'VOLATILE'
END as volatility,
CASE p.proparallel
WHEN 'r' THEN 'RESTRICTED'
WHEN 's' THEN 'SAFE'
WHEN 'u' THEN 'UNSAFE'
END as parallel,
CASE WHEN p.prosecdef THEN 'SECURITY DEFINER' ELSE 'SECURITY INVOKER' END as security,
p.procost as cost,
p.prorows as estimated_rows,
pg_get_userbyid(p.proowner) as owner,
d.description as description
FROM pg_proc p
JOIN pg_namespace n ON p.pronamespace = n.oid
JOIN pg_language l ON p.prolang = l.oid
LEFT JOIN pg_description d ON p.oid = d.objoid
WHERE n.nspname NOT IN ('pg_catalog', 'information_schema')
ORDER BY n.nspname, p.proname;"
} > "$OUTPUT_DIR/user_defined_functions.txt"
# Also add function source code in a separate file
{
echo "User-Defined Functions Source Code"
echo "================================="
echo ""
run_query "SELECT pg_get_functiondef(f.oid) FROM pg_catalog.pg_proc f INNER JOIN pg_catalog.pg_namespace n ON (f.pronamespace = n.oid) WHERE n.nspname = 'public';"
} > "$OUTPUT_DIR/user_defined_functions_source.txt"
# Sequences information
{
echo "Total Number of Sequences: $(run_query "SELECT count(*) FROM pg_sequences;")"
echo ""
echo "Database | Schema | Sequence Name | Data Type | Start Value | Min Value | Max Value | Increment | Cycle | Cache | Last Value"
echo "----------|---------|---------------|------------|-------------|-----------|------------|-----------|--------|--------|------------"
run_query "SELECT
current_database() as database,
schemaname as schema,
sequencename as sequence_name,
data_type,
start_value,
min_value,
max_value,
increment_by,
CASE WHEN cycle THEN 'YES' ELSE 'NO' END as cycle,
cache_size as cache,
last_value
FROM pg_sequences
ORDER BY schemaname, sequencename;"
} > "$OUTPUT_DIR/sequences.txt"
}
# Function to generate summary report
generate_report() {
echo "Generating summary report..."
{
echo "# PostgreSQL Pre-Check Report"
echo "Date: $(date)"
echo
echo "## Version"
cat "$OUTPUT_DIR/version.txt"
echo
echo "## Databases"
cat "$OUTPUT_DIR/databases.txt"
echo
echo "## Database Sizes"
cat "$OUTPUT_DIR/database_sizes.txt"
echo
echo "## Top 20 Table and Index Sizes"
cat "$OUTPUT_DIR/table_index_sizes.txt"
echo
echo "## Notable Settings"
grep -E "(max_connections|shared_buffers|work_mem|maintenance_work_mem|effective_cache_size)" "$OUTPUT_DIR/settings.txt"
echo
echo "## Installed Extensions"
cat "$OUTPUT_DIR/extensions.txt"
echo
echo "## Current Activity Summary"
grep -c . "$OUTPUT_DIR/activity.txt"
echo "active connections"
echo
echo "## Index Count"
wc -l < "$OUTPUT_DIR/indexes.txt"
echo "total indexes"
echo
echo "## User Roles"
cat "$OUTPUT_DIR/roles.txt"
echo
echo "## Logical Replication Support"
cat "$OUTPUT_DIR/logical_replication.txt"
echo
echo "## Number of Replicas"
cat "$OUTPUT_DIR/replica_count.txt"
echo "active replicas"
echo
echo "## Long-Running Queries"
cat "$OUTPUT_DIR/long_running_queries.txt"
echo
echo "## Max Locks Per Transaction"
cat "$OUTPUT_DIR/max_locks_per_transaction.txt"
echo
echo "## Total Active Locks"
cat "$OUTPUT_DIR/active_locks.txt"
echo
echo "## Locks Information"
cat "$OUTPUT_DIR/locks_information.txt"
echo
echo "## Partitioned Tables"
if [ -s "$OUTPUT_DIR/partitions.txt" ]; then
cat "$OUTPUT_DIR/partitions.txt"
else
echo "No partitioned tables found."
fi
echo
echo "## Auto-Generated Columns"
if [ -s "$OUTPUT_DIR/auto_generated_columns.txt" ]; then
cat "$OUTPUT_DIR/auto_generated_columns.txt"
else
echo "No auto-generated columns found."
fi
echo
echo "## Event Triggers"
if [ -s "$OUTPUT_DIR/event_triggers.txt" ]; then
cat "$OUTPUT_DIR/event_triggers.txt"
else
echo "No event triggers found."
fi
echo
echo "## User-Defined Functions"
if [ -s "$OUTPUT_DIR/user_defined_functions.txt" ]; then
cat "$OUTPUT_DIR/user_defined_functions.txt"
else
echo "No user-defined functions found."
fi
echo
echo "## User-Defined Functions Source Code"
if [ -s "$OUTPUT_DIR/user_defined_functions_source.txt" ]; then
cat "$OUTPUT_DIR/user_defined_functions_source.txt"
else
echo "No user-defined functions source code found."
fi
echo
} > "$OUTPUT_DIR/summary_report.md"
echo "Summary report generated: $OUTPUT_DIR/summary_report.md"
}
# Function to perform a version-agnostic dump
perform_version_agnostic_dump() {
echo "Performing database dump..."
DUMP_FILE="$OUTPUT_DIR/database_dump.sql"
# Dump schema (keep this part as it was)
echo "-- Schema dump" > "$DUMP_FILE"
PGPASSWORD=$PGPASSWORD psql -h "$PGHOST" -p "$PGPORT" -U "$PGUSER" -d "$PGDATABASE" -t -c "
-- Schemas
SELECT 'CREATE SCHEMA IF NOT EXISTS ' || quote_ident(nspname) || ';'
FROM pg_namespace
WHERE nspname NOT IN ('public', 'information_schema', 'pg_catalog', 'pg_toast');
-- Tables
SELECT 'CREATE TABLE ' || quote_ident(n.nspname) || '.' || quote_ident(c.relname) || ' (' ||
string_agg(quote_ident(a.attname) || ' ' || pg_catalog.format_type(a.atttypid, a.atttypmod) ||
CASE WHEN a.attnotnull THEN ' NOT NULL' ELSE '' END ||
CASE WHEN ad.adbin IS NOT NULL THEN ' DEFAULT ' || pg_get_expr(ad.adbin, ad.adrelid) ELSE '' END,
', ') || ');'
FROM pg_class c
JOIN pg_namespace n ON c.relnamespace = n.oid
JOIN pg_attribute a ON c.oid = a.attrelid
LEFT JOIN pg_attrdef ad ON a.attrelid = ad.adrelid AND a.attnum = ad.adnum
WHERE c.relkind = 'r' AND a.attnum > 0 AND NOT a.attisdropped
AND n.nspname NOT IN ('pg_catalog', 'information_schema')
GROUP BY n.nspname, c.relname, c.oid;
-- Indexes
SELECT pg_get_indexdef(i.indexrelid)
FROM pg_index i
JOIN pg_class c ON i.indexrelid = c.oid
JOIN pg_namespace n ON c.relnamespace = n.oid
WHERE n.nspname NOT IN ('pg_catalog', 'information_schema');
-- Views
SELECT 'CREATE OR REPLACE VIEW ' || quote_ident(n.nspname) || '.' || quote_ident(c.relname) || ' AS ' ||
pg_get_viewdef(c.oid)
FROM pg_class c
JOIN pg_namespace n ON c.relnamespace = n.oid
WHERE c.relkind = 'v' AND n.nspname NOT IN ('pg_catalog', 'information_schema');
-- Functions
SELECT 'CREATE OR REPLACE FUNCTION ' || quote_ident(n.nspname) || '.' || quote_ident(p.proname) || '(' ||
pg_get_function_arguments(p.oid) || ') RETURNS ' || pg_get_function_result(p.oid) || ' AS $BODY$' ||
pg_get_functiondef(p.oid) || '$BODY$ LANGUAGE ' || l.lanname || ';'
FROM pg_proc p
JOIN pg_namespace n ON p.pronamespace = n.oid
JOIN pg_language l ON p.prolang = l.oid
WHERE n.nspname NOT IN ('pg_catalog', 'information_schema');
" >> "$DUMP_FILE"
# Dump data (modified part)
echo "-- Data dump" >> "$DUMP_FILE"
PGPASSWORD=$PGPASSWORD psql -h "$PGHOST" -p "$PGPORT" -U "$PGUSER" -d "$PGDATABASE" -t -c "
SELECT quote_ident(n.nspname) || '.' || quote_ident(c.relname) AS full_table_name
FROM pg_class c
JOIN pg_namespace n ON c.relnamespace = n.oid
WHERE c.relkind = 'r' AND n.nspname NOT IN ('pg_catalog', 'information_schema');" | while read -r table; do
if [ -n "$table" ]; then
echo "Dumping data for table: $table"
echo "COPY $table FROM stdin;" >> "$DUMP_FILE"
PGPASSWORD=$PGPASSWORD psql -h "$PGHOST" -p "$PGPORT" -U "$PGUSER" -d "$PGDATABASE" -c "COPY $table TO STDOUT;" >> "$DUMP_FILE"
echo "\\." >> "$DUMP_FILE"
fi
done
if [ $? -eq 0 ]; then
echo "Database dump completed successfully. Dump file: $DUMP_FILE"
else
echo "Error: Database dump failed. Please check your permissions and connection details."
return 1
fi
}
# New function to capture \d+ output
capture_table_details() {
echo "Capturing detailed table information..."
TABLE_DETAILS_FILE="$OUTPUT_DIR/table_details.txt"
echo "Detailed Table Information" > "$TABLE_DETAILS_FILE"
echo "===========================" >> "$TABLE_DETAILS_FILE"
echo "" >> "$TABLE_DETAILS_FILE"
# Get list of all tables
tables=$(PGPASSWORD=$PGPASSWORD psql -h "$PGHOST" -p "$PGPORT" -U "$PGUSER" -d "$PGDATABASE" -t -c "SELECT schemaname || '.' || tablename FROM pg_tables WHERE schemaname NOT IN ('pg_catalog', 'information_schema') ORDER BY schemaname, tablename;")
# Loop through each table and capture \d+ output
while read -r table; do
if [ -n "$table" ]; then
echo "Table: $table" >> "$TABLE_DETAILS_FILE"
echo "------------------------" >> "$TABLE_DETAILS_FILE"
PGPASSWORD=$PGPASSWORD psql -h "$PGHOST" -p "$PGPORT" -U "$PGUSER" -d "$PGDATABASE" -c "\d+ $table" >> "$TABLE_DETAILS_FILE"
echo "" >> "$TABLE_DETAILS_FILE"
fi
done <<< "$tables"
echo "Detailed table information captured in: $TABLE_DETAILS_FILE"
}
# Modify the main function to include the new capture_table_details function
main() {
collect_pg_info
capture_table_details
generate_report
if [ "$PERFORM_DUMP" = true ]; then
perform_version_agnostic_dump
fi
echo "Pre-check completed. Please review the summary report and table details."
}
# Parse command line arguments
PERFORM_DUMP=false
while [[ $# -gt 0 ]]; do
case $1 in
--host=*)
PGHOST="${1#*=}"
shift
;;
--port=*)
PGPORT="${1#*=}"
shift
;;
--user=*)
PGUSER="${1#*=}"
shift
;;
--dbname=*)
PGDATABASE="${1#*=}"
shift
;;
--password=*)
export PGPASSWORD="${1#*=}"
shift
;;
--dump)
PERFORM_DUMP=true
shift
;;
*)
echo "Unknown parameter: $1"
exit 1
;;
esac
done
# Check if required parameters are set
if [ -z "$PGHOST" ] || [ -z "$PGUSER" ] || [ -z "$PGPASSWORD" ]; then
echo "Error: Host, user, and password are required. Use --host=, --user=, and --password= parameters."
exit 1
fi
# Run the main function
main