bloat estimation

NikolayS · NikolayS · commit 64adbf8d108e · 2017-12-24T23:33:23.000+03:00
diff --git a/bloat/btree_estimation.sql b/bloat/btree_estimation.sql
@@ -0,0 +1,96 @@
+-- enhanced version of https://github.com/ioguix/pgsql-bloat-estimation/blob/master/btree/btree_bloat.sql
+
+-- WARNING: when executed with a non-superuser role, the query inspects only indexes on tables you are granted to read.
+-- WARNING: rows with is_na = 't' are known to have bad statistics ("name" type is not supported).
+-- This query requires PostgreSQL 9.2 or later (it uses a WITH clause and pg_size_pretty(numeric))
+
+ with data as ( -- per-index B-tree bloat estimate computed from catalog statistics (pg_class, pg_stats); the indexes themselves are not scanned
+  SELECT current_database(), nspname AS schemaname, tblname, idxname, bs*(relpages)::bigint AS real_size,
+    bs*(relpages-est_pages)::bigint AS extra_size, -- bytes beyond the page estimate that ignores fillfactor
+    100 * (relpages-est_pages)::float / relpages AS extra_ratio,
+    fillfactor, bs*(relpages-est_pages_ff) AS bloat_size, -- bytes beyond the page estimate that honors fillfactor
+    100 * (relpages-est_pages_ff)::float / relpages AS bloat_ratio,
+    is_na
+    -- , 100-(sub.pst).avg_leaf_density, est_pages, index_tuple_hdr_bm, maxalign, pagehdr, nulldatawidth, nulldatahdrwidth, sub.reltuples, sub.relpages -- (DEBUG INFO)
+  FROM (
+    SELECT coalesce(1 + -- est_pages: estimated page count when the usable space of every page is completely filled
+         ceil(reltuples/floor((bs-pageopqdata-pagehdr)/(4+nulldatahdrwidth)::float)), 0 -- ItemIdData size + computed avg size of a tuple (nulldatahdrwidth)
+      ) AS est_pages,
+      coalesce(1 + -- est_pages_ff: same estimate with the usable page space scaled by fillfactor/100
+         ceil(reltuples/floor((bs-pageopqdata-pagehdr)*fillfactor/(100*(4+nulldatahdrwidth)::float))), 0
+      ) AS est_pages_ff,
+      bs, nspname, table_oid, tblname, idxname, relpages, fillfactor, is_na
+      -- , stattuple.pgstatindex(quote_ident(nspname)||'.'||quote_ident(idxname)) AS pst, index_tuple_hdr_bm, maxalign, pagehdr, nulldatawidth, nulldatahdrwidth, reltuples -- (DEBUG INFO)
+    FROM (
+      SELECT maxalign, bs, nspname, tblname, idxname, reltuples, relpages, relam, table_oid, fillfactor,
+        ( index_tuple_hdr_bm +
+            maxalign - CASE -- Add padding to the index tuple header to align on MAXALIGN
+              WHEN index_tuple_hdr_bm%maxalign = 0 THEN maxalign
+              ELSE index_tuple_hdr_bm%maxalign
+            END
+          + nulldatawidth + maxalign - CASE -- Add padding to the data to align on MAXALIGN
+              WHEN nulldatawidth = 0 THEN 0
+              WHEN nulldatawidth::integer%maxalign = 0 THEN maxalign
+              ELSE nulldatawidth::integer%maxalign
+            END
+        )::numeric AS nulldatahdrwidth, pagehdr, pageopqdata, is_na
+        -- , index_tuple_hdr_bm, nulldatawidth -- (DEBUG INFO)
+      FROM (
+        SELECT -- one row per index: catalog data plus per-column statistics aggregated over the index columns
+          i.nspname, i.tblname, i.idxname, i.reltuples, i.relpages, i.relam, a.attrelid AS table_oid,
+          current_setting('block_size')::numeric AS bs, fillfactor,
+          CASE -- MAXALIGN: 4 on 32bits, 8 on 64bits (and mingw32 ?)
+            WHEN version() ~ 'mingw32' OR version() ~ '64-bit|x86_64|ppc64|ia64|amd64' THEN 8
+            ELSE 4
+          END AS maxalign,
+          /* per page header, fixed size: 20 for 7.X, 24 for others */
+          24 AS pagehdr,
+          /* per page btree opaque data */
+          16 AS pageopqdata,
+          /* per tuple header: add IndexAttributeBitMapData if some cols are null-able */
+          CASE WHEN max(coalesce(s.null_frac,0)) = 0
+            THEN 2 -- IndexTupleData size
+            ELSE 2 + (( 32 + 8 - 1 ) / 8) -- IndexTupleData size + IndexAttributeBitMapData size ( (max number of fields per index + 8 - 1) / 8 )
+          END AS index_tuple_hdr_bm,
+          /* data length: the space saved by NULL values is subtracted using the null fraction (null_frac) from the statistics */
+          sum( (1-coalesce(s.null_frac, 0)) * coalesce(s.avg_width, 1024)) AS nulldatawidth, -- falls back to a width of 1024 when avg_width is NULL
+          max( CASE WHEN a.atttypid = 'pg_catalog.name'::regtype THEN 1 ELSE 0 END ) > 0 AS is_na -- true when the index has at least one column of type "name"
+        FROM pg_attribute AS a
+          JOIN (
+            SELECT nspname, tbl.relname AS tblname, idx.relname AS idxname, idx.reltuples, idx.relpages, idx.relam,
+              indrelid, indexrelid, indkey::smallint[] AS attnum,
+              coalesce(substring(
+                array_to_string(idx.reloptions, ' ')
+                 from 'fillfactor=([0-9]+)')::smallint, 90) AS fillfactor -- falls back to 90 when reloptions carries no fillfactor
+            FROM pg_index
+              JOIN pg_class idx ON idx.oid=pg_index.indexrelid
+              JOIN pg_class tbl ON tbl.oid=pg_index.indrelid
+              JOIN pg_namespace ON pg_namespace.oid = idx.relnamespace
+            WHERE pg_index.indisvalid AND tbl.relkind = 'r' AND idx.relpages > 0 -- valid indexes on relkind 'r' tables that occupy at least one page
+          ) AS i ON a.attrelid = i.indexrelid
+          JOIN pg_stats AS s ON s.schemaname = i.nspname
+            AND ((s.tablename = i.tblname AND s.attname = pg_catalog.pg_get_indexdef(a.attrelid, a.attnum, TRUE)) -- stats from tbl
+            OR   (s.tablename = i.idxname AND s.attname = a.attname))-- stats from functional columns
+          JOIN pg_type AS t ON a.atttypid = t.oid -- NOTE(review): alias t is not referenced anywhere else in this query
+        WHERE a.attnum > 0
+        GROUP BY 1, 2, 3, 4, 5, 6, 7, 8, 9
+      ) AS s1
+    ) AS s2
+      JOIN pg_am am ON s2.relam = am.oid WHERE am.amname = 'btree' -- keep B-tree indexes only
+  ) AS sub
+  -- WHERE NOT is_na
+)
+select
+  current_database, schemaname, tblname, idxname,
+  real_size, pg_size_pretty(real_size::numeric) as real_size_pretty,
+  extra_size, pg_size_pretty(extra_size::numeric) as extra_size_pretty,
+  extra_ratio as "extra_ratio, %",
+  bloat_size, pg_size_pretty(bloat_size::numeric) as bloat_size_pretty,
+  bloat_ratio as "bloat_ratio, %",
+  fillfactor,
+  is_na,
+  real_size - bloat_size as live_data_size -- actual size minus the estimated bloat
+from data
+order by bloat_size desc
+;
+
diff --git a/bloat/index_pgstattuple.sql b/bloat/index_pgstattuple.sql
@@ -0,0 +1,31 @@
+--https://github.com/dataegret/pg-utils/tree/master/sql
+--pgstattuple extension required
+--WARNING: without index name/mask query will read all available indexes which could cause I/O spikes
+with indexes as ( -- per-index usage statistics for user indexes; each matching B-tree index is then measured with pgstatindex()
+    select * from pg_stat_user_indexes
+)
+select schemaname,
+table_name,
+pg_size_pretty(table_size) as table_size,
+index_name,
+pg_size_pretty(index_size) as index_size,
+idx_scan as index_scans,
+round(free_space * 100.0 / index_size, 1) as waste_percent, -- 100.0 forces numeric division; bigint division truncated the value before rounding
+pg_size_pretty(free_space) as waste
+from (
+    select schemaname, p.relname as table_name, indexrelname as index_name,
+    (select (case when avg_leaf_density = 'NaN' then 0 
+        else greatest(ceil(index_size * (1 - avg_leaf_density / (coalesce((SELECT (regexp_matches(reloptions::text, E'.*fillfactor=(\\d+).*'))[1]),'90')::real)))::bigint, 0) end)
+        from pgstatindex(p.indexrelid::regclass::text) -- regclass output is already quoted and schema-qualified when needed; prepending schemaname produced "schema.schema.index"
+    ) as free_space, -- bytes below the fillfactor target (default 90) according to avg_leaf_density; never negative
+    pg_relation_size(p.indexrelid) as index_size,
+    pg_relation_size(p.relid) as table_size,
+    idx_scan
+    from indexes p
+    join pg_class c on p.indexrelid = c.oid
+    where pg_get_indexdef(p.indexrelid) like '%USING btree%' and
+    --put your index name/mask here
+    indexrelname ~ ''
+) t
+order by free_space desc;
+
diff --git a/bloat/table_estimation.sql b/bloat/table_estimation.sql
@@ -0,0 +1,74 @@
+-- enhanced version of https://github.com/ioguix/pgsql-bloat-estimation/blob/master/table/table_bloat.sql
+
+/* WARNING: when executed with a non-superuser role, the query inspects only tables you are granted to read.
+* This query requires PostgreSQL 9.2 through 11 (it uses pg_size_pretty(numeric) and pg_class.relhasoids, which was removed in PostgreSQL 12)
+*/
+
+with data as ( -- per-table bloat estimate computed from catalog statistics (pg_class, pg_stats); the tables themselves are not scanned
+  SELECT current_database(), schemaname, tblname, bs*tblpages AS real_size,
+    (tblpages-est_tblpages)*bs AS extra_size, -- bytes beyond the page estimate that ignores fillfactor
+    CASE WHEN tblpages - est_tblpages > 0
+      THEN 100 * (tblpages - est_tblpages)/tblpages::float
+      ELSE 0
+    END AS extra_ratio, fillfactor, (tblpages-est_tblpages_ff)*bs AS bloat_size, -- bloat_size: bytes beyond the estimate that honors fillfactor
+    CASE WHEN tblpages - est_tblpages_ff > 0
+      THEN 100 * (tblpages - est_tblpages_ff)/tblpages::float
+      ELSE 0
+    END AS bloat_ratio, is_na
+    -- , (pst).free_percent + (pst).dead_tuple_percent AS real_frag
+  FROM (
+    SELECT ceil( reltuples / ( (bs-page_hdr)/tpl_size ) ) + ceil( toasttuples / 4 ) AS est_tblpages, -- heap pages at 100% fill plus one TOAST page per 4 TOAST tuples
+      ceil( reltuples / ( (bs-page_hdr)*fillfactor/(tpl_size*100) ) ) + ceil( toasttuples / 4 ) AS est_tblpages_ff, -- same, with usable page space scaled by fillfactor/100
+      tblpages, fillfactor, bs, tblid, schemaname, tblname, heappages, toastpages, is_na
+      -- , stattuple.pgstattuple(tblid) AS pst
+    FROM (
+    SELECT
+        ( 4 + tpl_hdr_size + tpl_data_size + (2*ma) -- 4 bytes + header + data, each of header and data padded up to a multiple of ma
+            - CASE WHEN tpl_hdr_size%ma = 0 THEN ma ELSE tpl_hdr_size%ma END
+          - CASE WHEN ceil(tpl_data_size)::int%ma = 0 THEN ma ELSE ceil(tpl_data_size)::int%ma END
+        ) AS tpl_size, bs - page_hdr AS size_per_block, (heappages + toastpages) AS tblpages, heappages,
+        toastpages, reltuples, toasttuples, bs, page_hdr, tblid, schemaname, tblname, fillfactor, is_na
+      FROM (
+        SELECT -- one row per table: catalog data plus per-column statistics aggregated over the table columns
+          tbl.oid AS tblid, ns.nspname AS schemaname, tbl.relname AS tblname, tbl.reltuples,
+          tbl.relpages AS heappages, coalesce(toast.relpages, 0) AS toastpages,
+          coalesce(toast.reltuples, 0) AS toasttuples,
+          coalesce(substring(
+            array_to_string(tbl.reloptions, ' ')
+            FROM 'fillfactor=([0-9]+)')::smallint, 100) AS fillfactor, -- captures all digits; the former two-character SIMILAR TO pattern read fillfactor=100 as 10
+          current_setting('block_size')::numeric AS bs,
+          CASE WHEN version()~'mingw32' OR version()~'64-bit|x86_64|ppc64|ia64|amd64' THEN 8 ELSE 4 END AS ma,
+          24 AS page_hdr,
+          23 + CASE WHEN MAX(coalesce(null_frac,0)) > 0 THEN ( 7 + count(*) ) / 8 ELSE 0::int END -- fixed 23 bytes, plus one bitmap bit per column (rounded up to bytes) when any column has NULLs
+             + CASE WHEN tbl.relhasoids THEN 4 ELSE 0 END AS tpl_hdr_size, -- plus 4 bytes when the table has OIDs
+         sum( (1-coalesce(s.null_frac, 0)) * coalesce(s.avg_width, 1024) ) AS tpl_data_size, -- falls back to a width of 1024 when avg_width is NULL
+          bool_or(att.atttypid = 'pg_catalog.name'::regtype) AS is_na -- true when the table has at least one column of type "name"
+        FROM pg_attribute AS att
+          JOIN pg_class AS tbl ON att.attrelid = tbl.oid
+          JOIN pg_namespace AS ns ON ns.oid = tbl.relnamespace
+          JOIN pg_stats AS s ON s.schemaname=ns.nspname
+            AND s.tablename = tbl.relname AND s.inherited=false AND s.attname=att.attname
+          LEFT JOIN pg_class AS toast ON tbl.reltoastrelid = toast.oid
+        WHERE att.attnum > 0 AND NOT att.attisdropped
+          AND tbl.relkind = 'r'
+        GROUP BY 1,2,3,4,5,6,7,8,9,10, tbl.relhasoids
+        ORDER BY 2,3
+      ) AS s
+    ) AS s2
+  ) AS s3
+  -- WHERE NOT is_na
+  --   AND tblpages*((pst).free_percent + (pst).dead_tuple_percent)::float4/100 >= 1
+)
+select current_database, schemaname, tblname,
+   real_size, pg_size_pretty(real_size::numeric) as real_size_pretty,
+   extra_size, pg_size_pretty(extra_size::numeric) as extra_size_pretty,
+   extra_ratio as "extra_ratio, %",
+   bloat_size, pg_size_pretty(bloat_size::numeric) as bloat_size_pretty,
+   bloat_ratio as "bloat_ratio, %",
+   fillfactor,
+   is_na,
+   real_size - bloat_size as live_data_size -- actual size minus the estimated bloat
+from data
+order by bloat_size desc
+;
+
diff --git a/bloat/table_pgstattuple.sql b/bloat/table_pgstattuple.sql
@@ -0,0 +1,28 @@
+--https://github.com/dataegret/pg-utils/tree/master/sql
+--pgstattuple extension required
+--WARNING: without table name/mask query will read all available tables which could cause I/O spikes
+SELECT nspname, -- one row per matching table: sizes and wasted space derived from pgstattuple free_space and the table fillfactor
+       relname,
+       pg_size_pretty(relation_size + toast_relation_size) AS total_size,
+       pg_size_pretty(toast_relation_size) AS toast_size,
+       round(((relation_size - (relation_size - free_space)*100/fillfactor)*100/greatest(relation_size, 1))::numeric, 1) AS table_waste_percent,
+       pg_size_pretty((relation_size - (relation_size - free_space)*100/fillfactor)::bigint) AS table_waste,
+       round(((toast_free_space + relation_size - (relation_size - free_space)*100/fillfactor)*100/greatest(relation_size + toast_relation_size, 1))::numeric, 1) AS total_waste_percent,
+       pg_size_pretty((toast_free_space + relation_size - (relation_size - free_space)*100/fillfactor)::bigint) AS total_waste
+FROM (
+    SELECT n.nspname, c.relname,
+           (SELECT heap_stat.free_space FROM pgstattuple(c.oid) AS heap_stat) AS free_space,
+           pg_relation_size(c.oid) AS relation_size,
+           (CASE WHEN c.reltoastrelid = 0 THEN 0 ELSE (SELECT toast_stat.free_space FROM pgstattuple(c.reltoastrelid) AS toast_stat) END) AS toast_free_space,
+           coalesce(pg_relation_size(c.reltoastrelid), 0) AS toast_relation_size,
+           coalesce((SELECT (regexp_matches(c.reloptions::text, E'.*fillfactor=(\\d+).*'))[1]),'100')::real AS fillfactor
+    FROM pg_class AS c
+    LEFT JOIN pg_namespace AS n ON n.oid = c.relnamespace
+    WHERE n.nspname NOT IN ('pg_catalog', 'information_schema')
+      AND n.nspname !~ '^pg_toast' AND c.relkind = 'r'
+      -- put your table name/mask here
+      AND c.relname ~ ''
+) AS per_table
+ORDER BY (toast_free_space + relation_size - (relation_size - free_space)*100/fillfactor) DESC
+LIMIT 20;
+
diff --git a/start.psql b/start.psql
@@ -1,17 +1,25 @@
 \echo Menu:
 \echo '   1  – Basic Node Information (master/replica, lag, DB size, tmp files)'
-\echo '   2  – ....'
+\echo '   2  – Sizes of tables'
+\echo '  b1  – Table bloat, rough estimation'
+\echo '  b2  – B-tree indexes bloat, rough estimation'
+\echo '  b3  – Table bloat, more precise (requires pgstattuple extension; expensive)'
+\echo '  b4  – Index bloat, more precise (requires pgstattuple extension; expensive)'
 \echo '   3  - Slowest Queries'
 \echo '  i1  - Unused/Redundant Indexes'
 \echo '  i2  - Rarely Used Indexes'
-\echo '   q  – Quit from this tool'
+\echo '   q  – Quit'
 \echo
 \echo 'Type your choice and press <Enter>:'
 \prompt d_step_unq
 \set d_stp '\'' :d_step_unq '\''
 select
   :d_stp::text = '1' as d_step_is_1,
   :d_stp::text = '2' as d_step_is_2,
+  :d_stp::text = 'b1' as d_step_is_b1,
+  :d_stp::text = 'b2' as d_step_is_b2,
+  :d_stp::text = 'b3' as d_step_is_b3,
+  :d_stp::text = 'b4' as d_step_is_b4,
   :d_stp::text = '3' as d_step_is_3,
   :d_stp::text = 'i1' as d_step_is_i1,
   :d_stp::text = 'i2' as d_step_is_i2,
@@ -24,6 +32,22 @@ select
   \echo '      2 is chosen!'
   \prompt 'Press <Enter> to continue…' d_dummy
   \i ./start.psql
+\elif :d_step_is_b1
+  \i ./bloat/table_estimation.sql
+  \prompt 'Press <Enter> to continue…' d_dummy
+  \i ./start.psql
+\elif :d_step_is_b2
+  \i ./bloat/btree_estimation.sql
+  \prompt 'Press <Enter> to continue…' d_dummy
+  \i ./start.psql
+\elif :d_step_is_b3
+  \i ./bloat/table_pgstattuple.sql
+  \prompt 'Press <Enter> to continue…' d_dummy
+  \i ./start.psql
+\elif :d_step_is_b4
+  \i ./bloat/index_pgstattuple.sql
+  \prompt 'Press <Enter> to continue…' d_dummy
+  \i ./start.psql
 \elif :d_step_is_3
   \echo '      3 is chosen!'
   \prompt 'Press <Enter> to continue…' d_dummy