diff --git a/postgres/changelog.d/19294.added b/postgres/changelog.d/19294.added new file mode 100644 index 0000000000000..1382b5fc2e907 --- /dev/null +++ b/postgres/changelog.d/19294.added @@ -0,0 +1 @@ +Added `postgresql.sequence.estimated_remaining` metric for monitoring remaining available values in sequences \ No newline at end of file diff --git a/postgres/datadog_checks/postgres/metadata.py b/postgres/datadog_checks/postgres/metadata.py index 09fd16752b992..7e9d5126a3293 100644 --- a/postgres/datadog_checks/postgres/metadata.py +++ b/postgres/datadog_checks/postgres/metadata.py @@ -21,7 +21,7 @@ from datadog_checks.postgres.util import get_list_chunks from .util import payload_pg_version -from .version_utils import VersionUtils +from .version_utils import V13, VersionUtils # default collection intervals in seconds DEFAULT_SETTINGS_COLLECTION_INTERVAL = 600 @@ -181,6 +181,28 @@ GROUP BY pi.inhparent; """ +PG_SEQUENCES_QUERY = """ +SELECT (stavalues1::text::bigint[])[array_upper(stavalues1::text::bigint[],1)] as current_value, +pg_attribute.attname AS column_name, +power(2, attlen * 8 - 1) - 1 as max_value, +t.relname AS table_name, +nsp.nspname AS schema_name +FROM pg_attribute +INNER JOIN pg_attrdef + ON adrelid = attrelid AND adnum = attnum AND pg_get_expr(adbin, adrelid) like 'nextval%' +INNER JOIN pg_class t ON attrelid = t.oid +INNER JOIN pg_namespace nsp ON t.relnamespace = nsp.oid AND relnamespace IN + (SELECT nsp.oid FROM pg_namespace nsp + LEFT JOIN pg_roles r on nsp.nspowner = r.oid + WHERE nspname NOT IN ( 'information_schema', 'pg_catalog' ) + AND nspname NOT LIKE 'pg_toast%' + AND nspname NOT LIKE 'pg_temp_%' + AND r.rolname != 'rds_superuser' + AND r.rolname != 'rdsadmin' + ) + INNER JOIN pg_statistic on attrelid = starelid AND attnum = staattnum; +""" + def agent_check_getter(self): return self._check @@ -313,6 +335,9 @@ def _collect_postgres_schemas(self): for database in schema_metadata: dbname = database["name"] + + self.collect_sequences(dbname) + if not self._should_collect_metadata(dbname, "database"): continue @@ -701,3 +726,32 @@ def _collect_postgres_settings(self): rows = cursor.fetchall() self._log.debug("Loaded %s rows from pg_settings", len(rows)) return [dict(row) for row in rows] + + @tracked_method(agent_check_getter=agent_check_getter) + def collect_sequences(self, dbname): + if self._check.version < V13: + # pg_sequence was introduced in Postgres 13 + return + with self.db_pool.get_connection(dbname, self._config.idle_connection_timeout) as conn: + with conn.cursor(cursor_factory=psycopg2.extras.DictCursor) as cursor: + cursor.execute(PG_SEQUENCES_QUERY) + rows = cursor.fetchall() + # Emit a single gauge for each sequence + for row in rows: + if row["current_value"]: + self._check.gauge( + "postgresql.sequence.estimated_remaining", + row["max_value"] - row["current_value"], + tags=self._tags_no_db + + [ + "max_value:{:.0f}".format(row["max_value"]), + "current_value:{:.0f}".format(row["current_value"]), + "db:{}".format(dbname), + "schema:{}".format(row["schema_name"]), + "table:{}".format(row["table_name"]), + "column:{}".format(row["column_name"]), + ], + hostname=self._check.resolved_hostname, + raw=True, + ) + # TODO: We should eventually collect these on the backend for recommendations/visibility diff --git a/postgres/metadata.csv b/postgres/metadata.csv index 49183d67a61cc..42ae2d723e4f2 100644 --- a/postgres/metadata.csv +++ b/postgres/metadata.csv @@ -146,6 +146,7 @@ postgresql.rows_updated,gauge,,row,second,Enabled with `relations`. The number o postgresql.running,gauge,,,,The number of instances running.,0,postgres,running, postgresql.seq_rows_read,gauge,,row,second,"Enabled with `relations`. The number of live rows fetched by sequential scans. This metric is tagged with db, schema, table.",0,postgres,seq rows rd, postgresql.seq_scans,gauge,,scan,second,"Enabled with `relations`. The number of sequential scans initiated on this table. This metric is tagged with db, schema, table.",0,postgres,seq scans, +postgresql.sequence.estimated_remaining,gauge,,,,"The estimated remaining values of a sequence. This estimate is based on pg_statistics and will be more accurate for smaller tables and when ANALYZE has been run recently. This metric is tagged with db, schema, table, and column.",0,postgres,sequence remaining, postgresql.sessions.abandoned,count,,session,,Number of database sessions to this database that were terminated because connection to the client was lost. This metric is tagged with db.,-1,postgres,postgres sessions abandoned, postgresql.sessions.active_time,count,,millisecond,,"Time spent executing SQL statements in this database, in milliseconds (this corresponds to the states active and fastpath function call in pg_stat_activity). This metric is tagged with db.",0,postgres,postgres active time, postgresql.sessions.count,count,,session,,Total number of sessions established to this database. This metric is tagged with db.,0,postgres,postgres sessions, diff --git a/postgres/tests/compose/resources/02_setup.sh b/postgres/tests/compose/resources/02_setup.sh index aca2c6b034b14..89b0ea385ced3 100755 --- a/postgres/tests/compose/resources/02_setup.sh +++ b/postgres/tests/compose/resources/02_setup.sh @@ -15,6 +15,7 @@ psql -v ON_ERROR_STOP=1 --username "$POSTGRES_USER" "datadog_test" <<-'EOSQL' CREATE EXTENSION pg_buffercache SCHEMA public; CREATE EXTENSION pg_stat_statements SCHEMA public; GRANT SELECT ON pg_stat_statements TO datadog; + GRANT SELECT ON pg_statistic TO datadog; CREATE SCHEMA IF NOT EXISTS datadog; GRANT USAGE ON SCHEMA datadog TO datadog; diff --git a/postgres/tests/compose/resources/03_load_data.sh b/postgres/tests/compose/resources/03_load_data.sh index 637b4e4a0cdc9..c8dcc434bde1f 100755 --- a/postgres/tests/compose/resources/03_load_data.sh +++ b/postgres/tests/compose/resources/03_load_data.sh @@ -36,10 +36,13 @@ psql -v ON_ERROR_STOP=1 --username "$POSTGRES_USER" datadog_test <<-EOSQL SELECT * FROM persons; SELECT * FROM persons; SELECT * FROM persons; + VACUUM ANALYZE persons; CREATE SCHEMA public2; CREATE TABLE public2.cities (city VARCHAR(255), country VARCHAR(255), PRIMARY KEY(city)); GRANT ALL PRIVILEGES ON ALL TABLES IN SCHEMA public TO bob; GRANT ALL PRIVILEGES ON ALL TABLES IN SCHEMA public TO blocking_bob; + + EOSQL # Create publication for logical replication tests diff --git a/postgres/tests/test_metadata.py b/postgres/tests/test_metadata.py index c85a2ccafb6a2..62acfcfe23c6e 100644 --- a/postgres/tests/test_metadata.py +++ b/postgres/tests/test_metadata.py @@ -10,7 +10,7 @@ from datadog_checks.base.utils.db.utils import DBMAsyncJob from .common import POSTGRES_VERSION -from .utils import run_one_check +from .utils import requires_over_13, run_one_check pytestmark = [pytest.mark.integration, pytest.mark.usefixtures('dd_environment')] @@ -404,6 +404,36 @@ def test_collect_schemas_interrupted(integration_check, dbm_instance, aggregator assert len(database_metadata[0]['schemas'][0]['tables']) == 1 +@requires_over_13 +def test_collect_sequences(integration_check, dbm_instance, aggregator): + dbm_instance["collect_schemas"] = {'enabled': True, 'collection_interval': 0.5} + dbm_instance['relations'] = [] + dbm_instance["database_autodiscovery"] = {"enabled": True, "include": ["datadog"]} + del dbm_instance['dbname'] + + check = integration_check(dbm_instance) + run_one_check(check, dbm_instance) + aggregator.assert_metric( + "postgresql.sequence.estimated_remaining", + value=None, + tags=[ + "column:{}".format('personid'), + "schema:{}".format('public'), + "table:{}".format('persons'), + "db:{}".format('datadog_test'), + "max_value:{}".format(2147483647), + "current_value:{}".format(2), + "database_hostname:stubbed.hostname", + "foo:bar", + "port:5432", + "postgresql_cluster_name:primary", + f'postgresql_version:{check.raw_version}', + f'system_identifier:{check.system_identifier}', + "replication_role:master", + ], + ) + + def assert_fields(keys: List[str], fields: List[str]): for field in fields: assert field in keys