-- Heroku's pg-extras queries in plain SQL (assumes pg >= 9.2)
-- show table and index bloat in your database ordered by most wasteful
-- https://github.com/heroku/heroku-pg-extras/blob/master/init.rb
WITH constants AS (
SELECT current_setting('block_size')::numeric AS bs, 23 AS hdr, 4 AS ma
), bloat_info AS (
SELECT
ma,bs,schemaname,tablename,
(datawidth+(hdr+ma-(case when hdr%ma=0 THEN ma ELSE hdr%ma END)))::numeric AS datahdr,
(maxfracsum*(nullhdr+ma-(case when nullhdr%ma=0 THEN ma ELSE nullhdr%ma END))) AS nullhdr2
FROM (
SELECT
schemaname, tablename, hdr, ma, bs,
SUM((1-null_frac)*avg_width) AS datawidth,
MAX(null_frac) AS maxfracsum,
hdr+(
SELECT 1+count(*)/8
FROM pg_stats s2
WHERE null_frac<>0 AND s2.schemaname = s.schemaname AND s2.tablename = s.tablename
) AS nullhdr
FROM pg_stats s, constants
GROUP BY 1,2,3,4,5
) AS foo
), table_bloat AS (
SELECT
schemaname, tablename, cc.relpages, bs,
CEIL((cc.reltuples*((datahdr+ma-
(CASE WHEN datahdr%ma=0 THEN ma ELSE datahdr%ma END))+nullhdr2+4))/(bs-20::float)) AS otta
FROM bloat_info
JOIN pg_class cc ON cc.relname = bloat_info.tablename
JOIN pg_namespace nn ON cc.relnamespace = nn.oid AND nn.nspname = bloat_info.schemaname AND nn.nspname <> 'information_schema'
), index_bloat AS (
SELECT
schemaname, tablename, bs,
COALESCE(c2.relname,'?') AS iname, COALESCE(c2.reltuples,0) AS ituples, COALESCE(c2.relpages,0) AS ipages,
COALESCE(CEIL((c2.reltuples*(datahdr-12))/(bs-20::float)),0) AS iotta -- very rough approximation, assumes all cols
FROM bloat_info
JOIN pg_class cc ON cc.relname = bloat_info.tablename
JOIN pg_namespace nn ON cc.relnamespace = nn.oid AND nn.nspname = bloat_info.schemaname AND nn.nspname <> 'information_schema'
JOIN pg_index i ON indrelid = cc.oid
JOIN pg_class c2 ON c2.oid = i.indexrelid
)
SELECT
type, schemaname, object_name, bloat, pg_size_pretty(raw_waste) as waste
FROM (
SELECT
'table' as type,
schemaname,
tablename as object_name,
ROUND(CASE WHEN otta=0 THEN 0.0 ELSE table_bloat.relpages/otta::numeric END,1) AS bloat,
CASE WHEN relpages < otta THEN '0' ELSE (bs*(table_bloat.relpages-otta)::bigint)::bigint END AS raw_waste
FROM table_bloat
UNION
SELECT
'index' as type,
schemaname,
tablename || '::' || iname as object_name,
ROUND(CASE WHEN iotta=0 OR ipages=0 THEN 0.0 ELSE ipages/iotta::numeric END,1) AS bloat,
CASE WHEN ipages < iotta THEN '0' ELSE (bs*(ipages-iotta))::bigint END AS raw_waste
FROM index_bloat
) bloat_summary
ORDER BY raw_waste DESC, bloat DESC
;
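-- Not part of pg-extras: a hedged follow-up once the bloat query above has
-- flagged an object. VACUUM FULL rewrites the whole table under an exclusive
-- lock and REINDEX rebuilds a single index; both names below are hypothetical
-- stand-ins for objects reported by the query.
VACUUM FULL VERBOSE orders;            -- hypothetical bloated table
REINDEX INDEX index_orders_on_state;   -- hypothetical bloated index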
-- display queries holding locks that other queries are waiting on
-- https://github.com/heroku/heroku-pg-extras/blob/master/init.rb
-- assumes pg >= 9.2
SELECT bl.pid AS blocked_pid,
ka.query AS blocking_statement,
now() - ka.query_start AS blocking_duration,
kl.pid AS blocking_pid,
a.query AS blocked_statement,
now() - a.query_start AS blocked_duration
FROM pg_catalog.pg_locks bl
JOIN pg_catalog.pg_stat_activity a
ON bl.pid = a.pid
JOIN pg_catalog.pg_locks kl
JOIN pg_catalog.pg_stat_activity ka
ON kl.pid = ka.pid
ON bl.transactionid = kl.transactionid AND bl.pid != kl.pid
WHERE NOT bl.granted;
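-- Not part of pg-extras: once a blocking_pid has been identified above, the
-- gentler option is to cancel its current statement; terminating the backend
-- drops the whole connection. 12345 is a hypothetical pid from the result set.
SELECT pg_cancel_backend(12345);
-- SELECT pg_terminate_backend(12345);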
-- calculates your cache hit rate (effective databases are at 99% and up)
-- https://github.com/heroku/heroku-pg-extras/blob/master/init.rb
SELECT
'index hit rate' AS name,
(sum(idx_blks_hit)) / sum(idx_blks_hit + idx_blks_read) AS ratio
FROM pg_statio_user_indexes
UNION ALL
SELECT
'cache hit rate' AS name,
sum(heap_blks_hit) / (sum(heap_blks_hit) + sum(heap_blks_read)) AS ratio
FROM pg_statio_user_tables;
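-- Not part of pg-extras: a per-table breakdown can help locate what is being
-- read from disk. This is a sketch using the same pg_statio_user_tables view;
-- tables that have never been touched return NULL.
SELECT relname,
heap_blks_hit,
heap_blks_read,
CASE WHEN heap_blks_hit + heap_blks_read = 0 THEN NULL
ELSE round(heap_blks_hit::numeric / (heap_blks_hit + heap_blks_read), 3)
END AS table_hit_ratio
FROM pg_statio_user_tables
ORDER BY heap_blks_read DESC;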
-- show the size of indexes, descending by size
-- https://github.com/heroku/heroku-pg-extras/blob/master/init.rb
SELECT relname AS name,
pg_size_pretty(sum(relpages::bigint*8192)::bigint) AS size
FROM pg_class
WHERE reltype = 0
GROUP BY relname
ORDER BY sum(relpages) DESC;
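-- Not part of pg-extras: a hedged variant that asks the storage manager for the
-- actual on-disk size instead of relpages * 8192, which depends on the last
-- ANALYZE and on an 8 kB block size.
SELECT relname AS name,
pg_size_pretty(pg_relation_size(oid)) AS size
FROM pg_class
WHERE relkind = 'i'
ORDER BY pg_relation_size(oid) DESC;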
-- calculates, per table, the percentage of scans that use an index (well-indexed databases are at 99% and up)
-- https://github.com/heroku/heroku-pg-extras/blob/master/init.rb
SELECT relname,
CASE idx_scan
WHEN 0 THEN 'Insufficient data'
ELSE (100 * idx_scan / (seq_scan + idx_scan))::text
END percent_of_times_index_used,
n_live_tup rows_in_table
FROM
pg_stat_user_tables
ORDER BY
n_live_tup DESC;
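-- Not part of pg-extras: when a large table shows a low percentage above, the
-- usual fix is an index on the column(s) its frequent WHERE clauses filter on.
-- Table and column names here are hypothetical; CONCURRENTLY avoids blocking
-- writes while the index is built.
CREATE INDEX CONCURRENTLY index_orders_on_customer_id ON orders (customer_id);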
-- terminates ALL connections except the current one
-- https://github.com/heroku/heroku-pg-extras/blob/master/init.rb
-- assumes pg >= 9.2
SELECT pg_terminate_backend(pid)
FROM pg_stat_activity
WHERE pid <> pg_backend_pid()
AND query <> '<insufficient privilege>'
;
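-- Not part of pg-extras: a narrower variant that only terminates connections to
-- one database; 'mydb' is a hypothetical database name.
SELECT pg_terminate_backend(pid)
FROM pg_stat_activity
WHERE pid <> pg_backend_pid()
AND datname = 'mydb'
;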
-- display queries with active locks
-- https://github.com/heroku/heroku-pg-extras/blob/master/init.rb
-- assumes pg >= 9.2
SELECT
pg_stat_activity.pid,
pg_class.relname,
pg_locks.transactionid,
pg_locks.granted,
substr(pg_stat_activity.query,1,30) AS query_snippet,
age(now(),pg_stat_activity.query_start) AS "age"
FROM pg_stat_activity, pg_locks
LEFT OUTER JOIN pg_class
ON (pg_locks.relation = pg_class.oid)
WHERE pg_stat_activity.query <> '<insufficient privilege>'
AND pg_locks.pid = pg_stat_activity.pid
AND pg_locks.mode = 'ExclusiveLock'
ORDER BY query_start;
-- show all queries taking longer than five minutes ordered by duration descending
-- https://github.com/heroku/heroku-pg-extras/blob/master/init.rb
-- assumes pg >= 9.2
SELECT
pid,
now() - pg_stat_activity.query_start AS duration,
query AS query
FROM
pg_stat_activity
WHERE
pg_stat_activity.query <> ''::text
AND state <> 'idle'
AND now() - pg_stat_activity.query_start > interval '5 minutes'
ORDER BY
now() - pg_stat_activity.query_start DESC
;
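-- Not part of pg-extras: a hedged preventive measure is to cap statement run
-- time for the current session (it can also be set per role or database) so
-- runaway queries are cancelled automatically; 5 minutes is an arbitrary example.
SET statement_timeout = '5min';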
-- show the Mandelbrot set
-- https://github.com/heroku/heroku-pg-extras/blob/master/init.rb
WITH RECURSIVE Z(IX, IY, CX, CY, X, Y, I) AS (
SELECT IX, IY, X::float, Y::float, X::float, Y::float, 0
FROM (select -2.2 + 0.031 * i, i from generate_series(0,101) as i) as xgen(x,ix),
(select -1.5 + 0.031 * i, i from generate_series(0,101) as i) as ygen(y,iy)
UNION ALL
SELECT IX, IY, CX, CY, X * X - Y * Y + CX AS X, Y * X * 2 + CY, I + 1
FROM Z
WHERE X * X + Y * Y < 16::float
AND I < 100
)
SELECT array_to_string(array_agg(SUBSTRING(' .,,,-----++++%%%%@@@@#### ', LEAST(GREATEST(I,1),27), 1)),'')
FROM (
SELECT IX, IY, MAX(I) AS I
FROM Z
GROUP BY IY, IX
ORDER BY IY, IX
) AS ZT
GROUP BY IY
ORDER BY IY
;
-- view active queries with execution time
-- https://github.com/heroku/heroku-pg-extras/blob/master/init.rb
-- assumes pg >= 9.2
SELECT
pid,
application_name AS source,
age(now(),query_start) AS running_for,
waiting,
query AS query
FROM pg_stat_activity
WHERE
query <> '<insufficient privilege>'
AND state <> 'idle'
AND pid <> pg_backend_pid()
ORDER BY query_start DESC
;
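-- Not part of pg-extras: on PostgreSQL 9.6 and later the boolean "waiting"
-- column was removed from pg_stat_activity in favour of wait_event_type and
-- wait_event, so a variant of the query above for those versions could be:
SELECT
pid,
application_name AS source,
age(now(),query_start) AS running_for,
wait_event_type,
wait_event,
query AS query
FROM pg_stat_activity
WHERE
query <> '<insufficient privilege>'
AND state <> 'idle'
AND pid <> pg_backend_pid()
ORDER BY query_start DESC
;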
-- show the count of sequential scans by table, descending by count
-- https://github.com/heroku/heroku-pg-extras/blob/master/init.rb
SELECT relname AS name, seq_scan as count
FROM pg_stat_user_tables
ORDER BY seq_scan DESC;
-- show the total size of all indexes in MB
-- https://github.com/heroku/heroku-pg-extras/blob/master/init.rb
SELECT pg_size_pretty(sum(relpages::bigint*8192)::bigint) AS size
FROM pg_class
WHERE reltype = 0;
-- Show unused and almost unused indexes, ordered by their size relative to
-- the number of index scans. Exclude indexes of very small tables (less than
-- 5 pages), where the planner will almost invariably select a sequential
-- scan, but may not in the future as the table grows.
--
-- https://github.com/heroku/heroku-pg-extras/blob/master/init.rb
SELECT
schemaname || '.' || relname AS table,
indexrelname AS index,
pg_size_pretty(pg_relation_size(i.indexrelid)) AS index_size,
idx_scan as index_scans
FROM pg_stat_user_indexes ui
JOIN pg_index i ON ui.indexrelid = i.indexrelid
WHERE NOT indisunique AND idx_scan < 50 AND pg_relation_size(relid) > 5 * 8192
ORDER BY
pg_relation_size(i.indexrelid) / nullif(idx_scan, 0) DESC NULLS FIRST,
pg_relation_size(i.indexrelid) DESC
;
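-- Not part of pg-extras: once an index reported above is confirmed unused (and
-- is not backing a constraint or replica identity), it can be dropped without
-- blocking writes; the index name is hypothetical.
DROP INDEX CONCURRENTLY IF EXISTS index_orders_on_legacy_code;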
-- Show dead rows and whether an automatic vacuum is expected to be triggered
-- https://github.com/heroku/heroku-pg-extras/blob/master/init.rb
WITH table_opts AS (
SELECT
pg_class.oid, relname, nspname, array_to_string(reloptions, '') AS relopts
FROM
pg_class INNER JOIN pg_namespace ns ON relnamespace = ns.oid
), vacuum_settings AS (
SELECT
oid, relname, nspname,
CASE
WHEN relopts LIKE '%autovacuum_vacuum_threshold%'
THEN regexp_replace(relopts, '.*autovacuum_vacuum_threshold=([0-9.]+).*', E'\\1')::integer
ELSE current_setting('autovacuum_vacuum_threshold')::integer
END AS autovacuum_vacuum_threshold,
CASE
WHEN relopts LIKE '%autovacuum_vacuum_scale_factor%'
THEN regexp_replace(relopts, '.*autovacuum_vacuum_scale_factor=([0-9.]+).*', E'\\1')::real
ELSE current_setting('autovacuum_vacuum_scale_factor')::real
END AS autovacuum_vacuum_scale_factor
FROM
table_opts
)
SELECT
vacuum_settings.nspname AS schema,
vacuum_settings.relname AS table,
to_char(psut.last_vacuum, 'YYYY-MM-DD HH24:MI') AS last_vacuum,
to_char(psut.last_autovacuum, 'YYYY-MM-DD HH24:MI') AS last_autovacuum,
to_char(pg_class.reltuples, '9G999G999G999') AS rowcount,
to_char(psut.n_dead_tup, '9G999G999G999') AS dead_rowcount,
to_char(autovacuum_vacuum_threshold
+ (autovacuum_vacuum_scale_factor::numeric * pg_class.reltuples), '9G999G999G999') AS autovacuum_threshold,
CASE
WHEN autovacuum_vacuum_threshold + (autovacuum_vacuum_scale_factor::numeric * pg_class.reltuples) < psut.n_dead_tup
THEN 'yes'
END AS expect_autovacuum
FROM
pg_stat_user_tables psut INNER JOIN pg_class ON psut.relid = pg_class.oid
INNER JOIN vacuum_settings ON pg_class.oid = vacuum_settings.oid
ORDER BY 1
;
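-- Not part of pg-extras: if a table keeps showing expect_autovacuum = 'yes',
-- it can be vacuumed by hand and/or given a tighter per-table scale factor so
-- autovacuum fires sooner; the table name and 0.02 are hypothetical examples.
VACUUM (VERBOSE, ANALYZE) orders;
ALTER TABLE orders SET (autovacuum_vacuum_scale_factor = 0.02);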