5033 fk indexing round2 (#5040)

* updated query to find more results and be simpler

* updating query in fhir

---------

Co-authored-by: leif stawnyczy <leifstawnyczy@leifs-mbp.home>
This commit is contained in:
TipzCM 2023-06-28 15:37:45 -04:00 committed by GitHub
parent 17eeb07c58
commit ce04e897cf
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
2 changed files with 54 additions and 148 deletions

View File

@ -0,0 +1,8 @@
---
type: fix
issue: 5033
title: "
Updated the query that is supposed to help detect foreign key constraints
that also do not have indexes to be a) simpler (smaller) and b) find more results.
Added an additional entry to the whitelist as a result.
"

View File

@ -22,7 +22,6 @@ package ca.uhn.fhir.jpa.embedded;
import com.google.common.collect.HashMultimap; import com.google.common.collect.HashMultimap;
import com.google.common.collect.Multimap; import com.google.common.collect.Multimap;
import org.intellij.lang.annotations.Language; import org.intellij.lang.annotations.Language;
import org.postgresql.jdbc.PgArray;
import org.slf4j.Logger; import org.slf4j.Logger;
import org.slf4j.LoggerFactory; import org.slf4j.LoggerFactory;
@ -57,137 +56,41 @@ public class HapiForeignKeyIndexHelper {
@Language("SQL") @Language("SQL")
private static final String FK_QUERY = """ private static final String FK_QUERY = """
WITH fk_actions ( code, action ) AS ( SELECT c.conrelid::regclass AS "table",
VALUES ( 'a', 'error' ), /* list of key column names in order */
( 'r', 'restrict' ), string_agg(a.attname, ',' ORDER BY x.n) AS columns,
( 'c', 'cascade' ), pg_catalog.pg_size_pretty(
( 'n', 'set null' ), pg_catalog.pg_relation_size(c.conrelid)
( 'd', 'set default' ) ) AS size,
), c.conname AS constraint,
fk_list AS ( c.confrelid::regclass AS referenced_table
SELECT pg_constraint.oid as fkoid, conrelid, confrelid as parentid, FROM pg_catalog.pg_constraint c
conname, relname, nspname, /* enumerated key column numbers per foreign key */
fk_actions_update.action as update_action, CROSS JOIN LATERAL
fk_actions_delete.action as delete_action, unnest(c.conkey) WITH ORDINALITY AS x(attnum, n)
conkey as key_cols /* name for each key column */
FROM pg_constraint JOIN pg_catalog.pg_attribute a
JOIN pg_class ON conrelid = pg_class.oid ON a.attnum = x.attnum
JOIN pg_namespace ON pg_class.relnamespace = pg_namespace.oid AND a.attrelid = c.conrelid
JOIN fk_actions AS fk_actions_update ON confupdtype = fk_actions_update.code WHERE NOT EXISTS
JOIN fk_actions AS fk_actions_delete ON confdeltype = fk_actions_delete.code /* is there a matching index for the constraint? */
WHERE contype = 'f' (SELECT 1 FROM pg_catalog.pg_index i
-- unique keys are indexed by default; so exclude any UNIQUE column constraints WHERE i.indrelid = c.conrelid
AND not (conkey = any(select conkey from pg_constraint where contype = 'u')) /* it must not be a partial index */
), AND i.indpred IS NULL
fk_attributes AS ( /* the first index columns must be the same as the
SELECT fkoid, conrelid, attname, attnum key columns, but order doesn't matter */
FROM fk_list AND (i.indkey::smallint[])[0:cardinality(c.conkey)-1]
JOIN pg_attribute OPERATOR(pg_catalog.@>) c.conkey)
ON conrelid = attrelid AND c.contype = 'f'
AND attnum = ANY( key_cols ) GROUP BY c.conrelid, c.conname, c.confrelid
ORDER BY fkoid, attnum ORDER BY pg_catalog.pg_relation_size(c.conrelid) DESC;
), """;
fk_cols_list AS (
SELECT fkoid, array_agg(attname) as cols_list
FROM fk_attributes
GROUP BY fkoid
),
index_list AS (
SELECT indexrelid as indexid,
pg_class.relname as indexname,
indrelid,
indkey,
indpred is not null as has_predicate,
pg_get_indexdef(indexrelid) as indexdef
FROM pg_index
JOIN pg_class ON indexrelid = pg_class.oid
WHERE indisvalid
),
fk_index_match AS (
SELECT fk_list.*,
indexid,
indexname,
indkey::int[] as indexatts,
has_predicate,
indexdef,
array_length(key_cols, 1) as fk_colcount,
array_length(indkey,1) as index_colcount,
round(pg_relation_size(conrelid)/(1024^2)::numeric) as table_mb,
cols_list
FROM fk_list
JOIN fk_cols_list USING (fkoid)
LEFT OUTER JOIN index_list
ON conrelid = indrelid
AND (indkey::int2[])[0:(array_length(key_cols,1) -1)] @> key_cols
),
fk_perfect_match AS (
SELECT fkoid
FROM fk_index_match
WHERE (index_colcount - 1) <= fk_colcount
AND NOT has_predicate
AND indexdef LIKE '%USING btree%'
),
fk_index_check AS (
SELECT 'no index' as issue, *, 1 as issue_sort
FROM fk_index_match
WHERE indexid IS NULL
UNION ALL
SELECT 'questionable index' as issue, *, 2
FROM fk_index_match
WHERE indexid IS NOT NULL
AND fkoid NOT IN (
SELECT fkoid
FROM fk_perfect_match)
),
parent_table_stats AS (
SELECT fkoid, tabstats.relname as parent_name,
(n_tup_ins + n_tup_upd + n_tup_del + n_tup_hot_upd) as parent_writes,
round(pg_relation_size(parentid)/(1024^2)::numeric) as parent_mb
FROM pg_stat_user_tables AS tabstats
JOIN fk_list
ON relid = parentid
),
fk_table_stats AS (
SELECT fkoid,
(n_tup_ins + n_tup_upd + n_tup_del + n_tup_hot_upd) as writes,
seq_scan as table_scans
FROM pg_stat_user_tables AS tabstats
JOIN fk_list
ON relid = conrelid
)
SELECT nspname as schema_name,
relname as table_name,
conname as fk_name,
issue,
table_mb,
writes,
table_scans,
parent_name,
parent_mb,
parent_writes,
cols_list,
indexdef
FROM fk_index_check
JOIN parent_table_stats USING (fkoid)
JOIN fk_table_stats USING (fkoid)
WHERE issue = 'no index'
ORDER BY issue_sort, table_mb DESC, table_name, fk_name;
""";
// columns
private static final String TABLE_NAME = "table_name";
private static final String FK_NAME = "fk_name";
private static final String PARENT_TABLE_NAME = "parent_name";
private static final String COLS_LIST = "cols_list";
private static final String ISSUE = "issue";
private static final Logger ourLog = LoggerFactory.getLogger(HapiForeignKeyIndexHelper.class); private static final Logger ourLog = LoggerFactory.getLogger(HapiForeignKeyIndexHelper.class);
protected static final Multimap<String, String> ourTableToColumnsWhitelist = HashMultimap.create(); protected static final Multimap<String, String> ourTableToColumnsWhitelist = HashMultimap.create();
private static final String MESSAGE = "\nUnindexed foreign key detected!\nTable: %s, Column: %s, FKIndex Name: %s, Parent Table: %s, Issue: %s";
public HapiForeignKeyIndexHelper() { public HapiForeignKeyIndexHelper() {
populateWhiteList(); populateWhiteList();
} }
@ -209,6 +112,9 @@ public class HapiForeignKeyIndexHelper {
// TODO - LS - entries below here require further investigation // TODO - LS - entries below here require further investigation
// MPI_LINK_AID - autogenerated table // MPI_LINK_AID - autogenerated table
ourTableToColumnsWhitelist.put("MPI_LINK_AUD", "REV"); ourTableToColumnsWhitelist.put("MPI_LINK_AUD", "REV");
// hfj_history_tag - tag_id - do we ever delete by tag history by tag_id (or at all)?
ourTableToColumnsWhitelist.put("HFJ_HISTORY_TAG", "TAG_ID");
} }
public void ensureAllForeignKeysAreIndexed(DataSource theDataSource) throws SQLException { public void ensureAllForeignKeysAreIndexed(DataSource theDataSource) throws SQLException {
@ -217,31 +123,23 @@ public class HapiForeignKeyIndexHelper {
ResultSet results = statement.executeQuery(FK_QUERY); ResultSet results = statement.executeQuery(FK_QUERY);
while (results.next()) { while (results.next()) {
PgArray postgresArray = (PgArray) results.getArray(COLS_LIST); String tableName = results.getString("table").toUpperCase();
String[] columns = (String[]) postgresArray.getArray(); String columns = results.getString("columns").toUpperCase();
String tableName = results.getString(TABLE_NAME); String constraint = results.getString("constraint").toUpperCase();
String fkConstraintName = results.getString(FK_NAME); String referenced_table = results.getString("referenced_table").toUpperCase();
String parentTableName = results.getString(PARENT_TABLE_NAME);
String issue = results.getString(ISSUE);
Collection<String> whitelistColumns = ourTableToColumnsWhitelist.get(tableName.toUpperCase()); ourLog.warn(String.format("Table %s, Columns %s, Constraint %s, Referenced Table %s", tableName, columns, constraint, referenced_table));
for (String col : columns) {
boolean isWhitelisted = whitelistColumns.contains(col.toUpperCase()); Collection<String> whiteListColumns = ourTableToColumnsWhitelist.get(tableName);
if (!isWhitelisted) { boolean isWhiteListed = whiteListColumns.contains(columns);
ourLog.error(String.format(MESSAGE,
tableName, assertTrue(isWhiteListed,
col, String.format("Unindexed foreign key detected! Table.column: %s.%s. Constraint: %s", tableName, columns, constraint)
fkConstraintName, );
parentTableName,
issue));
}
assertTrue(isWhitelisted,
String.format("Unindexed foreign key detected! Table.column: %s.%s.", tableName, col)
);
}
} }
} }
} }
} }
} }