diff --git a/alerts/google-cloudsql/1p-cloudsql-instance-in-failed-state.v1.json b/alerts/google-cloudsql/1p-cloudsql-instance-in-failed-state.v1.json index c434a0ca30..532ca61011 100644 --- a/alerts/google-cloudsql/1p-cloudsql-instance-in-failed-state.v1.json +++ b/alerts/google-cloudsql/1p-cloudsql-instance-in-failed-state.v1.json @@ -1,7 +1,7 @@ { - "displayName": "CloudSQL - Instance in Failed State", + "displayName": "Cloud SQL - Instance in Failed State", "documentation": { - "content": "This Alert fires when any CloudSQL Instance has stopped working and has entered an error state. The cause should be investigated and the instance should be restored from a backup. for more information around managing instances and troubleshooting failed instances visit: https://cloud.google.com/sql/docs/troubleshooting#managing-instances", + "content": "This alert fires when any Cloud SQL instance has stopped working and has entered an error state. The cause should be investigated and the instance should be restored from a backup. For more information on managing instances and troubleshooting failed instances visit: https://cloud.google.com/sql/docs/troubleshooting#managing-instances", "mimeType": "text/markdown" }, "userLabels": {}, @@ -35,4 +35,4 @@ "combiner": "OR", "enabled": true, "notificationChannels": [] -} \ No newline at end of file +} diff --git a/alerts/google-cloudsql/1p-postgresql-slow-transactions.v1.json b/alerts/google-cloudsql/1p-postgresql-slow-transactions.v1.json index a4027f869f..ad3dadc5c5 100644 --- a/alerts/google-cloudsql/1p-postgresql-slow-transactions.v1.json +++ b/alerts/google-cloudsql/1p-postgresql-slow-transactions.v1.json @@ -1,7 +1,7 @@ { "displayName": "PostgreSQL - Slow Transactions", "documentation": { - "content": "This Alert fires if the database is having trouble keeping up transactions. You should investigate performance improvements, such as increasing resources for CloudSQL, improving query efficiency, and more. 
For additional information visit https://cloud.google.com/sql/docs/postgres/diagnose-issues.", + "content": "This alert fires if the database is having trouble keeping up with transactions. You should investigate performance improvements, such as increasing resources for Cloud SQL, improving query efficiency, and more. For additional information visit https://cloud.google.com/sql/docs/postgres/diagnose-issues.", "mimeType": "text/markdown" }, "userLabels": {}, @@ -31,4 +31,4 @@ "combiner": "OR", "enabled": true, "notificationChannels": [] -} \ No newline at end of file +} diff --git a/alerts/google-cloudsql/1p-replication-in-error-state.v1.json b/alerts/google-cloudsql/1p-replication-in-error-state.v1.json index 6a83ba8785..463a6de0b7 100644 --- a/alerts/google-cloudsql/1p-replication-in-error-state.v1.json +++ b/alerts/google-cloudsql/1p-replication-in-error-state.v1.json @@ -1,7 +1,7 @@ { "displayName": "Replication in Error State", "documentation": { - "content": "This Alert fires when any replica has stopped working and has entered an error state. For more information around disaster recovery visit: https://cloud.google.com/sql/docs/mysql/replication/cross-region-replicas.", + "content": "This alert fires when any replica has stopped working and has entered an error state. 
For more information on disaster recovery visit: https://cloud.google.com/sql/docs/mysql/replication/cross-region-replicas.", "mimeType": "text/markdown" }, "userLabels": {}, @@ -31,4 +31,4 @@ "combiner": "OR", "enabled": true, "notificationChannels": [] -} \ No newline at end of file +} diff --git a/alerts/google-cloudsql/README.md b/alerts/google-cloudsql/README.md index 7908954656..3263f6fce0 100644 --- a/alerts/google-cloudsql/README.md +++ b/alerts/google-cloudsql/README.md @@ -1,8 +1,8 @@ -# Alerts for CloudSQL in the Ops Agent +# Alerts for Cloud SQL in the Ops Agent ## Spiking Evictions -If `cloudsql.googleapis.com/database/postgresql/vacuum/oldest_transaction_age` is higher than `10` it indicates that postgres is having issues keeping up with the amount of queries. +If `cloudsql.googleapis.com/database/postgresql/vacuum/oldest_transaction_age` is higher than `10` it indicates that PostgreSQL is having issues keeping up with the number of queries. ## Replication in Error State @@ -14,7 +14,7 @@ If any instance in `cloudsql.googleapis.com/database/instance_state` has a state ### Creating Notification Channels and User Labels -Whether these alert policies are being used as standalones or base templates for a deployment strategy like terraform, one thing that should be utilized is notification channels and user labels. +Whether these alert policies are being used as standalones or base templates for a deployment strategy like Terraform, one thing that should be utilized is notification channels and user labels. 
### User Labels diff --git a/alerts/google-cloudsql/metadata.yaml b/alerts/google-cloudsql/metadata.yaml index 7b57933ece..fb8327a4e7 100644 --- a/alerts/google-cloudsql/metadata.yaml +++ b/alerts/google-cloudsql/metadata.yaml @@ -1,8 +1,8 @@ alert_policy_templates: - id: 1p-cloudsql-instance-in-failed-state - display_name: CloudSQL - Instance in Failed State - description: "This Alert fires when any CloudSQL Instance has stopped working and has entered an error state. The cause should be investigated and the instance should be restored from a backup. for more information around managing instances and troubleshooting failed instances visit: https://cloud.google.com/sql/docs/troubleshooting#managing-instances" + display_name: Cloud SQL - Instance in Failed State + description: "This alert fires when any Cloud SQL instance has stopped working and has entered an error state. The cause should be investigated and the instance should be restored from a backup. For more information on managing instances and troubleshooting failed instances visit: https://cloud.google.com/sql/docs/troubleshooting#managing-instances" version: 1 related_integrations: - id: cloud_sql @@ -10,7 +10,7 @@ alert_policy_templates: - id: 1p-postgresql-slow-transactions display_name: PostgreSQL - Slow Transactions - description: "This Alert fires if the database is having trouble keeping up transactions. You should investigate performance improvements, such as increasing resources for CloudSQL, improving query efficiency, and more. For additional information visit https://cloud.google.com/sql/docs/postgres/diagnose-issues." + description: "This alert fires if the database is having trouble keeping up with transactions. You should investigate performance improvements, such as increasing resources for Cloud SQL, improving query efficiency, and more. For additional information visit https://cloud.google.com/sql/docs/postgres/diagnose-issues." 
version: 1 related_integrations: - id: cloud_sql @@ -18,7 +18,7 @@ alert_policy_templates: - id: 1p-replication-in-error-state display_name: Replication in Error State - description: "This Alert fires when any replica has stopped working and has entered an error state. For more information around disaster recovery visit: https://cloud.google.com/sql/docs/mysql/replication/cross-region-replicas." + description: "This alert fires when any replica has stopped working and has entered an error state. For more information on disaster recovery visit: https://cloud.google.com/sql/docs/mysql/replication/cross-region-replicas." version: 1 related_integrations: - id: cloud_sql diff --git a/dashboards/google-cloudsql/README.md b/dashboards/google-cloudsql/README.md index 181b567ced..957c0dc06b 100644 --- a/dashboards/google-cloudsql/README.md +++ b/dashboards/google-cloudsql/README.md @@ -1,20 +1,20 @@ -### Dashboards for CloudSQL +### Dashboards for Cloud SQL #### Notes - These dashboards are based on first party Google Cloud monitoring solutions. -|CloudSQL - General| +|Cloud SQL - General| |:------------------| |Filename: [cloudsql-general.json](cloudsql-general.json)| -|This dashboard has charts displaying logs from CloudSQL as well as charts of instance states and network throughput. | +|This dashboard has charts displaying logs from Cloud SQL as well as charts of instance states and network throughput. | -|CloudSQL - Replication| +|Cloud SQL - Replication| |:------------------| |Filename: [cloudsql-replication.json](cloudsql-replication.json)| -|This dashboard has charts displaying information about replication states and replication performance from CloudSQL. | +|This dashboard has charts displaying information about replication states and replication performance from Cloud SQL. 
| -|CloudSQL - Transactions| +|Cloud SQL - Transactions| |:------------------| |Filename: [cloudsql-transactions.json](cloudsql-transactions.json)| -|This dashboard has charts displaying information regarding transactions and queries from mysql, mssql, and postgresql in CloudSQL as well as charts relating to network activity. | +|This dashboard has charts displaying information regarding transactions and queries from MySQL, PostgreSQL, and SQL Server in Cloud SQL as well as charts relating to network activity. | diff --git a/dashboards/google-cloudsql/cloudsql-general.json b/dashboards/google-cloudsql/cloudsql-general.json index 36d88f52ca..dac0a66166 100644 --- a/dashboards/google-cloudsql/cloudsql-general.json +++ b/dashboards/google-cloudsql/cloudsql-general.json @@ -13,7 +13,7 @@ "labelKey": "database_id" } ], - "displayName": "CloudSQL - General", + "displayName": "Cloud SQL - General", "mosaicLayout": { "columns": 12, "tiles": [ @@ -110,7 +110,7 @@ "filter": "resource.type=\"cloudsql_database\"", "resourceNames": [] }, - "title": "All - CloudSQL Logs" + "title": "All - Cloud SQL Logs" }, "width": 4, "xPos": 4, @@ -123,7 +123,7 @@ "filter": "resource.type=\"cloudsql_database\"\nlogName=~\".*cloudsql.googleapis.com.*\"\nseverity>=ERROR", "resourceNames": [] }, - "title": "All - CloudSQL Database Error Logs" + "title": "All - Cloud SQL Database Error Logs" }, "width": 4, "xPos": 8, @@ -200,7 +200,7 @@ "height": 2, "widget": { "text": { - "content": "The below chart gives a count of how many CloudSQL instances are in each state. ", + "content": "The below chart gives a count of how many Cloud SQL instances are in each state. 
", "format": "RAW" }, "title": "Instance States" @@ -239,10 +239,10 @@ "height": 2, "widget": { "text": { - "content": "This logs widget shows all the logs relating to CloudSQL database instances.", + "content": "This logs widget shows all the logs relating to Cloud SQL database instances.", "format": "RAW" }, - "title": "All - CloudSQL Logs" + "title": "All - Cloud SQL Logs" }, "width": 4, "xPos": 4, @@ -252,10 +252,10 @@ "height": 2, "widget": { "text": { - "content": "This logs widget shows all the logs relating to CloudSQL database instances at the error severity level.", + "content": "This logs widget shows all the logs relating to Cloud SQL database instances at the error severity level.", "format": "RAW" }, - "title": "All - CloudSQL Database Error Logs" + "title": "All - Cloud SQL Database Error Logs" }, "width": 4, "xPos": 8, @@ -265,7 +265,7 @@ "height": 2, "widget": { "text": { - "content": "This chart shows CloudSQL instances with the top 5 highest throughput received bytes.", + "content": "This chart shows Cloud SQL instances with the top 5 highest throughput received bytes.", "format": "RAW" }, "title": "Top 5 Highest Network Received Bytes" @@ -278,7 +278,7 @@ "height": 2, "widget": { "text": { - "content": "This chart shows CloudSQL instances with the top 5 highest throughput received bytes.", + "content": "This chart shows Cloud SQL instances with the top 5 highest throughput received bytes.", "format": "RAW" }, "title": "Top 5 Highest Network Sent Bytes" @@ -289,4 +289,4 @@ } ] } -} \ No newline at end of file +} diff --git a/dashboards/google-cloudsql/cloudsql-replication.json b/dashboards/google-cloudsql/cloudsql-replication.json index d434deb577..8ce1685955 100644 --- a/dashboards/google-cloudsql/cloudsql-replication.json +++ b/dashboards/google-cloudsql/cloudsql-replication.json @@ -13,7 +13,7 @@ "labelKey": "zone" } ], - "displayName": "CloudSQL - Replication", + "displayName": "Cloud SQL - Replication", "mosaicLayout": { "columns": 12, 
"tiles": [ @@ -185,7 +185,7 @@ "height": 2, "widget": { "text": { - "content": "Top 5 Replication instances with the highest CPU usage that indicates what replications are under the most load.", + "content": "Top 5 replication instances with the highest CPU usage that indicates what replications are under the most load.", "format": "RAW" }, "title": "Top 5 Replications with Highest CPU Usage" @@ -198,7 +198,7 @@ "height": 2, "widget": { "text": { - "content": "Top 5 Replication instances with the highest Memory usage that indicates what replications are under the most load.", + "content": "Top 5 replication instances with the highest memory usage that indicates what replications are under the most load.", "format": "RAW" }, "title": "Top 5 Replications with Highest Memory Usage" @@ -211,7 +211,7 @@ "height": 2, "widget": { "text": { - "content": "Top 5 Replicas that are the furthest behind the master node, in seconds.", + "content": "Top 5 replicas that are the furthest behind the master node, in seconds.", "format": "RAW" }, "title": "Top 5 Replications with Highest Replica Lag" @@ -224,7 +224,7 @@ "height": 2, "widget": { "text": { - "content": "Top 5 Replicas that are the furthest behind the master node, in seconds.", + "content": "Top 5 replicas that are the furthest behind the master node, in seconds.", "format": "RAW" }, "title": "Top 5 Replications with Highest Log Archive Failures" @@ -235,4 +235,4 @@ } ] } - } \ No newline at end of file + } diff --git a/dashboards/google-cloudsql/cloudsql-transactions.json b/dashboards/google-cloudsql/cloudsql-transactions.json index 7d11e7c139..6d98c21cf3 100644 --- a/dashboards/google-cloudsql/cloudsql-transactions.json +++ b/dashboards/google-cloudsql/cloudsql-transactions.json @@ -13,7 +13,7 @@ "labelKey": "database_id" } ], - "displayName": "CloudSQL - Transactions", + "displayName": "Cloud SQL - Transactions", "mosaicLayout": { "columns": 12, "tiles": [ @@ -210,7 +210,7 @@ "height": 2, "widget": { "text": { - 
"content": "The top 5 highest connections on postgreSQL instances", + "content": "The top 5 highest connections on PostgreSQL instances", "format": "RAW" }, "title": "PostgreSQL - Top 5 Highest Connections" @@ -262,7 +262,7 @@ "height": 2, "widget": { "text": { - "content": "The top 5 PostgreSQL instances with highest amount of rows being altered.", + "content": "The top 5 PostgreSQL instances with highest number of rows being altered.", "format": "RAW" }, "title": "PostgreSQL - Top 5 Highest DB Rows Affected" @@ -288,7 +288,7 @@ "height": 2, "widget": { "text": { - "content": "Top 5 instances that have the highest amount of queries executed against the db.", + "content": "Top 5 instances that have the highest number of queries executed against the db.", "format": "RAW" }, "title": "MySQL - Top 5 Highest Queries" @@ -299,4 +299,4 @@ } ] } - } \ No newline at end of file + } diff --git a/dashboards/google-cloudsql/metadata.yaml b/dashboards/google-cloudsql/metadata.yaml index 8ce5635a24..25aaba4b18 100644 --- a/dashboards/google-cloudsql/metadata.yaml +++ b/dashboards/google-cloudsql/metadata.yaml @@ -2,7 +2,7 @@ sample_dashboards: - category: Cloud SQL id: cloudsql-general - display_name: CloudSQL - General + display_name: Cloud SQL - General description: |- This dashboard has charts displaying logs from Cloud SQL as well as charts of instance states and network throughput. related_integrations: @@ -11,7 +11,7 @@ sample_dashboards: - category: Cloud SQL id: cloudsql-replication - display_name: CloudSQL - Replication + display_name: Cloud SQL - Replication description: |- This dashboard has charts displaying information about replication states and replication performance from Cloud SQL. 
related_integrations: @@ -20,9 +20,9 @@ sample_dashboards: - category: Cloud SQL id: cloudsql-transactions - display_name: CloudSQL - Transactions + display_name: Cloud SQL - Transactions description: |- - This dashboard has charts displaying information regarding transactions and queries from mysql, mssql, and postgresql in Cloud SQL as well as charts relating to network activity. + This dashboard has charts displaying information regarding transactions and queries from MySQL, PostgreSQL, and SQL Server in Cloud SQL as well as charts relating to network activity. related_integrations: - id: cloud_sql platform: GCP diff --git a/dashboards/logging/README.md b/dashboards/logging/README.md index cdc7e54c1a..9959c5e272 100644 --- a/dashboards/logging/README.md +++ b/dashboards/logging/README.md @@ -29,7 +29,7 @@ |Logging Usage - GCE| |:-----------------------| |Filename: [gce-usage.json](gce-usage.json)| -|This dashboard is fairly simple in that it primarily looks at the `Log Bytes Sent` and `Log Entries` metrics but also adds in some additional visualizations of `Entries By Severity`.| +|This dashboard is fairly simple in that it primarily looks at the `Log Bytes Sent` and `Log Entries` metrics but also adds in some additional visualizations of `Entries by Severity`.|   @@ -37,7 +37,7 @@ |Logging Usage - Cloud SQL| |:-----------------------| |Filename: [cloudsql-usage.json](cloudsql-usage.json)| -|This dashboard primarily looks at the `Log Bytes Sent` and `Log Entries` metrics but also adds in some additional visualizations of `Entries By Severity` for monitored resources of `cloudsql_database` and `cloudsql_instance_database`.| +|This dashboard primarily looks at the `Log Bytes Sent` and `Log Entries` metrics but also adds in some additional visualizations of `Entries by Severity` for monitored resources of `cloudsql_database` and `cloudsql_instance_database`.|   diff --git a/dashboards/logging/cloudsql-usage.json b/dashboards/logging/cloudsql-usage.json index 
844e59350c..d6d7db2ec4 100644 --- a/dashboards/logging/cloudsql-usage.json +++ b/dashboards/logging/cloudsql-usage.json @@ -146,7 +146,7 @@ { "height": 4, "widget": { - "title": "Log Bytes By Severity", + "title": "Log Bytes by Severity", "xyChart": { "chartOptions": { "mode": "COLOR" diff --git a/dashboards/logging/gce-usage.json b/dashboards/logging/gce-usage.json index 699227368e..263026d2a1 100644 --- a/dashboards/logging/gce-usage.json +++ b/dashboards/logging/gce-usage.json @@ -104,7 +104,7 @@ { "height": 4, "widget": { - "title": "Entries By Severity", + "title": "Entries by Severity", "xyChart": { "chartOptions": { "mode": "COLOR" diff --git a/dashboards/logging/metadata.yaml b/dashboards/logging/metadata.yaml index 8dbc2ff9ff..f295b040c2 100644 --- a/dashboards/logging/metadata.yaml +++ b/dashboards/logging/metadata.yaml @@ -18,12 +18,12 @@ sample_dashboards: category: Logging id: gce-usage display_name: Logging Usage - GCE - description: "This dashboard is fairly simple in that it primarily looks at the Log Bytes Sent and Log Entries metrics but also adds in some additional visualizations of Entries By Severity. These metrics are populated via [Google system logging metrics](https://cloud.google.com/monitoring/api/metrics_gcp#gcp-logging)." + description: "This dashboard is fairly simple in that it primarily looks at the Log Bytes Sent and Log Entries metrics but also adds in some additional visualizations of Entries by Severity. These metrics are populated via [Google system logging metrics](https://cloud.google.com/monitoring/api/metrics_gcp#gcp-logging)." - category: Logging id: cloudsql-usage display_name: Logging Usage - Cloud SQL - description: "This dashboard primarily looks at the Log Bytes Sent and Log Entries metrics but also adds in some additional visualizations of Entries By Severity for monitored resources of cloudsql_database and cloudsql_instance_database. 
These metrics are populated via [Google system logging metrics](https://cloud.google.com/monitoring/api/metrics_gcp#gcp-logging)." + description: "This dashboard primarily looks at the Log Bytes Sent and Log Entries metrics but also adds in some additional visualizations of Entries by Severity for monitored resources of cloudsql_database and cloudsql_instance_database. These metrics are populated via [Google system logging metrics](https://cloud.google.com/monitoring/api/metrics_gcp#gcp-logging)." - category: Logging id: dataflow-usage diff --git a/dashboards/storage/README.md b/dashboards/storage/README.md index 3740b4f0df..62418a1ac8 100644 --- a/dashboards/storage/README.md +++ b/dashboards/storage/README.md @@ -22,14 +22,14 @@   -|Cloud SQL(MySQL) Monitoring| +|Cloud SQL (MySQL) Monitoring| |:--------------------------| |Filename: [cloudsql-mysql-monitoring.json](cloudsql-mysql-monitoring.json)| |This dashboard has 6 charts for the [Cloud SQL(MySQL) metrics](https://cloud.google.com/monitoring/api/metrics_gcp#gcp-cloudsql), including `Database queries`, `Connections`, `Network bytes received/sent`, and the `InnoDB page` metrics.   -|Cloud SQL(PostgreSQL) Monitoring| +|Cloud SQL (PostgreSQL) Monitoring| |:-------------------------------| |Filename: [cloudsql-postgre-monitoring.json](cloudsql-postgre-monitoring.json) |This dashboard has 3 charts for the [Cloud SQL(PostgreSQL) metrics](https://cloud.google.com/monitoring/api/metrics_gcp#gcp-cloudsql), including `Number of transactions`, `Connections`, and `Lag bytes`. @@ -64,7 +64,7 @@   -|Redis Stats monitoring| +|Redis Stats Monitoring| |:---------------------| |Filename: [redis-stats-monitoring.json](redis-stats-monitoring.json)| |This dashboard has 14 charts for the stats of [Memorystore for Redis](https://cloud.google.com/monitoring/api/metrics_gcp#gcp-redis), including `Hits`, `Misses`, `Cache Hit Ratio`, `Evicted Keys`, `Expired Keys`, `Memory Usage Ratio`, and others. 
@@ -74,4 +74,4 @@ |Spanner Monitoring| |:-----------------| |Filename: [spanner-monitoring.json](spanner-monitoring.json)| -|This dashboard has 14 charts for the [Cloud Spanner metrics](https://cloud.google.com/monitoring/api/metrics_gcp#gcp-spanner), including `Count of queries by database`, `API requests by method`, `API bytes sent/received`, CPU and storage utilization, etc. \ No newline at end of file +|This dashboard has 14 charts for the [Cloud Spanner metrics](https://cloud.google.com/monitoring/api/metrics_gcp#gcp-spanner), including `Count of queries by database`, `API requests by method`, `API bytes sent/received`, CPU and storage utilization, etc. diff --git a/dashboards/storage/cloudsql-monitoring.json b/dashboards/storage/cloudsql-monitoring.json index 8ed335d5e6..becff360a6 100644 --- a/dashboards/storage/cloudsql-monitoring.json +++ b/dashboards/storage/cloudsql-monitoring.json @@ -152,7 +152,7 @@ } }, { - "title": "Total Memory quota, Memory usage", + "title": "Total memory quota, memory usage", "xyChart": { "chartOptions": { "mode": "COLOR" @@ -255,7 +255,7 @@ } }, { - "title": "Total Disk quota, Bytes used", + "title": "Total disk quota, bytes used", "xyChart": { "chartOptions": { "mode": "COLOR" diff --git a/dashboards/storage/cloudsql-mysql-monitoring.json b/dashboards/storage/cloudsql-mysql-monitoring.json index 8658eab0b3..3f070b1a8a 100644 --- a/dashboards/storage/cloudsql-mysql-monitoring.json +++ b/dashboards/storage/cloudsql-mysql-monitoring.json @@ -1,5 +1,5 @@ { - "displayName": "Cloud SQL(MySQL) Monitoring", + "displayName": "Cloud SQL (MySQL) Monitoring", "gridLayout": { "columns": "2", "widgets": [ diff --git a/dashboards/storage/cloudsql-postgre-monitoring.json b/dashboards/storage/cloudsql-postgre-monitoring.json index ad38069150..038f3c7278 100644 --- a/dashboards/storage/cloudsql-postgre-monitoring.json +++ b/dashboards/storage/cloudsql-postgre-monitoring.json @@ -1,5 +1,5 @@ { - "displayName": "Cloud SQL(PostgreSQL) Monitoring", 
+ "displayName": "Cloud SQL (PostgreSQL) Monitoring", "gridLayout": { "columns": "2", "widgets": [ @@ -32,7 +32,7 @@ } }, { - "title": "PostgreSQL Connections", + "title": "PostgreSQL connections", "xyChart": { "chartOptions": { "mode": "COLOR" diff --git a/dashboards/storage/metadata.yaml b/dashboards/storage/metadata.yaml index 6df6a13742..566ac40dda 100644 --- a/dashboards/storage/metadata.yaml +++ b/dashboards/storage/metadata.yaml @@ -15,18 +15,18 @@ sample_dashboards: display_name: Cloud SQL Monitoring description: |- This dashboard has 10 charts for the related [Cloud SQL metrics](https://cloud.google.com/monitoring/api/metrics_gcp#gcp-cloudsql), including Instance state, Server up, and CPU/Memory/Disk utilization etc. - This dashboard provides an aggregate view of total resources of your SQL databases. + This dashboard provides an aggregate view of total resources of your SQL databases. You can use database engine-specific dashboards for additional metrics of different database engines such as MySQL and PostgreSQL. - category: Storage id: cloudsql-mysql-monitoring - display_name: Cloud SQL(MySQL) Monitoring - description: "This dashboard has 6 charts for the [Cloud SQL(MySQL) metrics](https://cloud.google.com/monitoring/api/metrics_gcp#gcp-cloudsql), including Database queries, Connections, Network bytes received/sent, and the InnoDB page metrics." + display_name: Cloud SQL (MySQL) Monitoring + description: "This dashboard has 6 charts for the [Cloud SQL (MySQL) metrics](https://cloud.google.com/monitoring/api/metrics_gcp#gcp-cloudsql), including Database queries, Connections, Network bytes received/sent, and the InnoDB page metrics." - category: Storage id: cloudsql-postgre-monitoring - display_name: Cloud SQL(PostgreSQL) Monitoring - description: "This dashboard has 3 charts for the [Cloud SQL(PostgreSQL) metrics](https://cloud.google.com/monitoring/api/metrics_gcp#gcp-cloudsql), including Number of transactions, Connections, and Lag bytes." 
+ display_name: Cloud SQL (PostgreSQL) Monitoring + description: "This dashboard has 3 charts for the [Cloud SQL (PostgreSQL) metrics](https://cloud.google.com/monitoring/api/metrics_gcp#gcp-cloudsql), including Number of transactions, Connections, and Lag bytes." - category: Storage id: datastore-monitoring diff --git a/dashboards/zookeeper/README.md b/dashboards/zookeeper/README.md index 559031edc1..ee0361f55d 100644 --- a/dashboards/zookeeper/README.md +++ b/dashboards/zookeeper/README.md @@ -13,4 +13,4 @@ |Zookeeper Prometheus| |:------------------| |Filename: [zookeeper-prometheus.json](zookeeper-prometheus.json)| -|This dashboard is based on [built-in prometheus metrics](https://zookeeper.apache.org/doc/r3.6.3/zookeeperMonitor.html). This dashboard includes charts displaying: `Uptime`, `ZNodes Total Memory (GB)`, `ZNodes`, `Connections`, `Watch Count`, `Leader Elections Counter`, `Open File Descriptors`, `Fsync Time (ms)`, `Snapshot Time (ms)`, `Average Latency (ms)`, and `JVM Memory`| +|This dashboard is based on [built-in prometheus metrics](https://zookeeper.apache.org/doc/r3.6.3/zookeeperMonitor.html). This dashboard includes charts displaying: `Average Uptime (Days)`, `ZNodes Total Memory (GB)`, `ZNodes`, `Connections`, `Watch Count`, `Leader Elections Counter`, `Open File Descriptors`, `Fsync Time (ms)`, `Snapshot Time (ms)`, `Average Latency (ms)`, `JVM Memory Utilization`, `JVM Threads Deadlocked`, `JVM Garbage Collection Seconds`, `JVM Memory Pool Allocated Bytes`, and `JVM Threads State` | diff --git a/dashboards/zookeeper/metadata.yaml b/dashboards/zookeeper/metadata.yaml index 1a20d47dd7..42acccee1e 100644 --- a/dashboards/zookeeper/metadata.yaml +++ b/dashboards/zookeeper/metadata.yaml @@ -11,7 +11,7 @@ sample_dashboards: category: Zookeeper id: zookeeper-prometheus display_name: Zookeeper Prometheus Overview - description: "This dashboard is based on [built-in prometheus metrics](https://zookeeper.apache.org/doc/r3.6.3/zookeeperMonitor.html). 
This dashboard includes charts displaying: Uptime, ZNodes Total Memory (GB), ZNodes, Connections, Watch Count, Leader Elections Counter, Open File Descriptors, Fsync Time (ms), Snapshot Time (ms), Average Latency (ms), and JVM Memory" + description: "This dashboard is based on [built-in prometheus metrics](https://zookeeper.apache.org/doc/r3.6.3/zookeeperMonitor.html). This dashboard includes charts displaying: Average Uptime (Days), ZNodes Total Memory (GB), ZNodes, Connections, Watch Count, Leader Elections Counter, Open File Descriptors, Fsync Time (ms), Snapshot Time (ms), Average Latency (ms), JVM Memory Utilization, JVM Threads Deadlocked, JVM Garbage Collection Seconds, JVM Memory Pool Allocated Bytes, and JVM Threads State." related_integrations: - id: zookeeper platform: GKE diff --git a/dashboards/zookeeper/zookeeper-prometheus.json b/dashboards/zookeeper/zookeeper-prometheus.json index 87bcd91bfc..92b4dadc6c 100644 --- a/dashboards/zookeeper/zookeeper-prometheus.json +++ b/dashboards/zookeeper/zookeeper-prometheus.json @@ -1,5 +1,5 @@ { - "category": "CUSTOM", + "displayName": "Zookeeper Prometheus Overview", "dashboardFilters": [ { "filterType": "RESOURCE_LABEL", @@ -17,226 +17,243 @@ "templateVariable": "Namespace" } ], - "displayName": "Zookeeper Prometheus Overview", - "labels": {}, "mosaicLayout": { - "columns": 12, + "columns": 48, "tiles": [ { - "height": 2, + "width": 8, + "height": 8, "widget": { + "title": "Average Uptime (Days)", "scorecard": { "gaugeView": { + "lowerBound": 0, "upperBound": 1000 }, "thresholds": [ { "color": "RED", "direction": "ABOVE", + "label": "", "value": 730 }, - { - "color": "RED", - "direction": "BELOW", - "value": 0 - }, { "color": "YELLOW", "direction": "ABOVE", + "label": "", "value": 365 } ], "timeSeriesQuery": { - "prometheusQuery": "sum(uptime{${Cluster},${Location},${Namespace}}) / count(uptime{${Cluster},${Location},${Namespace}}) / 86400 / 1000" + "prometheusQuery": 
"sum(uptime{${Cluster},${Location},${Namespace}}) / count(uptime{${Cluster},${Location},${Namespace}}) / 86400 / 1000", + "unitOverride": "" } - }, - "title": "Average Uptime (days)" - }, - "width": 2, - "xPos": 0, - "yPos": 0 + } + } }, { - "height": 2, + "xPos": 16, + "width": 8, + "height": 8, "widget": { + "title": "ZNodes", "scorecard": { "gaugeView": { + "lowerBound": 0, "upperBound": 1000 }, "thresholds": [ { "color": "RED", "direction": "ABOVE", + "label": "", "value": 750 }, { "color": "RED", "direction": "BELOW", + "label": "", "value": 1 }, { "color": "YELLOW", "direction": "ABOVE", + "label": "", "value": 500 } ], "timeSeriesQuery": { - "prometheusQuery": "sum(znode_count{${Cluster},${Location},${Namespace}})" + "prometheusQuery": "sum(znode_count{${Cluster},${Location},${Namespace}})", + "unitOverride": "" } - }, - "title": "ZNodes" - }, - "width": 2, - "xPos": 0, - "yPos": 2 + } + } }, { - "height": 2, + "yPos": 20, + "width": 24, + "height": 8, "widget": { - "scorecard": { - "gaugeView": { - "upperBound": 65 + "title": "Connections", + "xyChart": { + "chartOptions": { + "mode": "COLOR" }, - "thresholds": [ - { - "color": "RED", - "direction": "ABOVE", - "value": 50 - }, + "dataSets": [ { - "color": "YELLOW", - "direction": "ABOVE", - "value": 40 + "breakdowns": [], + "dimensions": [], + "measures": [], + "plotType": "LINE", + "targetAxis": "Y1", + "timeSeriesQuery": { + "prometheusQuery": "sum(num_alive_connections{${Cluster},${Location},${Namespace}})", + "unitOverride": "" + } } ], - "timeSeriesQuery": { - "prometheusQuery": "sum(num_alive_connections{${Cluster},${Location},${Namespace}})" + "thresholds": [], + "yAxis": { + "label": "", + "scale": "LINEAR" } - }, - "title": "Connections" - }, - "width": 2, - "xPos": 2, - "yPos": 2 + } + } }, { - "height": 2, + "xPos": 8, + "width": 8, + "height": 8, "widget": { + "title": "ZNodes Total Memory (GB)", "scorecard": { "gaugeView": { + "lowerBound": 0, "upperBound": 1 }, "thresholds": [ { "color": 
"RED", "direction": "ABOVE", + "label": "", "value": 0.65 }, { "color": "YELLOW", "direction": "ABOVE", + "label": "", "value": 0.5 } ], "timeSeriesQuery": { - "prometheusQuery": "sum(approximate_data_size{${Cluster},${Location},${Namespace}} / 1024)" + "prometheusQuery": "sum(approximate_data_size{${Cluster},${Location},${Namespace}} / 1024)", + "unitOverride": "" } - }, - "title": "ZNodes Total Memory (GB)" - }, - "width": 2, - "xPos": 2, - "yPos": 0 + } + } }, { - "height": 2, + "xPos": 8, + "yPos": 8, + "width": 8, + "height": 8, "widget": { + "title": "Watch Count", "scorecard": { "gaugeView": { + "lowerBound": 0, "upperBound": 20000 }, "thresholds": [ { "color": "RED", "direction": "ABOVE", + "label": "", "value": 9000 }, { "color": "YELLOW", "direction": "ABOVE", + "label": "", "value": 5000 } ], "timeSeriesQuery": { - "prometheusQuery": "sum(watch_count{${Cluster},${Location},${Namespace}})" + "prometheusQuery": "sum(watch_count{${Cluster},${Location},${Namespace}})", + "unitOverride": "" } - }, - "title": "Watch Count" - }, - "width": 2, - "xPos": 0, - "yPos": 4 + } + } }, { - "height": 2, + "xPos": 16, + "yPos": 8, + "width": 8, + "height": 8, "widget": { + "title": "Leader Elections Counter", "scorecard": { "gaugeView": { + "lowerBound": 0, "upperBound": 1 }, "thresholds": [ { "color": "RED", "direction": "ABOVE", + "label": "", "value": 0.65 }, { "color": "YELLOW", "direction": "ABOVE", + "label": "", "value": 0.5 } ], "timeSeriesQuery": { - "prometheusQuery": "sum(increase(election_time_count{${Cluster},${Location},${Namespace}}[5m]))" + "prometheusQuery": "sum(increase(election_time_count{${Cluster},${Location},${Namespace}}[5m]))", + "unitOverride": "" } - }, - "title": "Leader Elections Counter" - }, - "width": 2, - "xPos": 2, - "yPos": 4 + } + } }, { - "height": 2, + "yPos": 8, + "width": 8, + "height": 8, "widget": { + "title": "Open File Descriptors", "scorecard": { "gaugeView": { + "lowerBound": 0, "upperBound": 1000 }, "thresholds": [ { 
"color": "RED", "direction": "ABOVE", + "label": "", "value": 600 }, { "color": "YELLOW", "direction": "ABOVE", + "label": "", "value": 300 } ], "timeSeriesQuery": { - "prometheusQuery": "sum(open_file_descriptor_count{${Cluster},${Location},${Namespace}})" + "prometheusQuery": "sum(open_file_descriptor_count{${Cluster},${Location},${Namespace}})", + "unitOverride": "" } - }, - "title": "Open File Descriptors" - }, - "width": 4, - "xPos": 0, - "yPos": 6 + } + } }, { - "height": 4, + "yPos": 44, + "width": 24, + "height": 8, "widget": { "title": "Fsync Time (ms)", "xyChart": { @@ -245,31 +262,36 @@ }, "dataSets": [ { + "breakdowns": [], + "dimensions": [], + "measures": [], "plotType": "LINE", "targetAxis": "Y1", "timeSeriesQuery": { - "prometheusQuery": "rate(fsynctime_sum{${Cluster},${Location},${Namespace}}[1m])" + "prometheusQuery": "rate(fsynctime_sum{${Cluster},${Location},${Namespace}}[1m])", + "unitOverride": "" } } ], "thresholds": [ { + "label": "", "targetAxis": "Y1", "value": 100 } ], "timeshiftDuration": "0s", "yAxis": { + "label": "", "scale": "LINEAR" } } - }, - "width": 4, - "xPos": 4, - "yPos": 0 + } }, { - "height": 4, + "yPos": 36, + "width": 24, + "height": 8, "widget": { "title": "Snapshot Time (ms)", "xyChart": { @@ -278,31 +300,36 @@ }, "dataSets": [ { + "breakdowns": [], + "dimensions": [], + "measures": [], "plotType": "LINE", "targetAxis": "Y1", "timeSeriesQuery": { - "prometheusQuery": "rate(snapshottime_sum{${Cluster},${Location},${Namespace}}[5m])" + "prometheusQuery": "rate(snapshottime_sum{${Cluster},${Location},${Namespace}}[5m])", + "unitOverride": "" } } ], "thresholds": [ { + "label": "", "targetAxis": "Y1", "value": 100 } ], "timeshiftDuration": "0s", "yAxis": { + "label": "", "scale": "LINEAR" } } - }, - "width": 4, - "xPos": 4, - "yPos": 4 + } }, { - "height": 4, + "yPos": 28, + "width": 24, + "height": 8, "widget": { "title": "Average Latency (ms)", "xyChart": { @@ -311,62 +338,238 @@ }, "dataSets": [ { + "breakdowns": [], + 
"dimensions": [], + "measures": [], "plotType": "LINE", "targetAxis": "Y1", "timeSeriesQuery": { - "prometheusQuery": "avg_latency{${Cluster},${Location},${Namespace}}" + "prometheusQuery": "avg_latency{${Cluster},${Location},${Namespace}}", + "unitOverride": "" } } ], "thresholds": [ { + "label": "", "targetAxis": "Y1", "value": 100 } ], "timeshiftDuration": "0s", "yAxis": { + "label": "", "scale": "LINEAR" } } - }, - "width": 4, - "xPos": 8, - "yPos": 0 + } }, { - "height": 4, + "xPos": 24, + "yPos": 20, + "width": 24, + "height": 8, "widget": { - "title": "JVM Memory", + "title": "JVM Memory Utilization", "xyChart": { "chartOptions": { "mode": "COLOR" }, "dataSets": [ { + "breakdowns": [], + "dimensions": [], + "measures": [], "plotType": "LINE", "targetAxis": "Y1", "timeSeriesQuery": { - "prometheusQuery": "jvm_memory_bytes_used{${Cluster},${Location},${Namespace}} / jvm_memory_bytes_max{area=\"heap\",${Cluster},${Location},${Namespace}}" + "prometheusQuery": "jvm_memory_bytes_used{${Cluster},${Location},${Namespace}} / jvm_memory_bytes_max{area=\"heap\",${Cluster},${Location},${Namespace}}", + "unitOverride": "" } } ], "thresholds": [ { + "label": "", "targetAxis": "Y1", "value": 0.8 } ], "timeshiftDuration": "0s", "yAxis": { + "label": "", "scale": "LINEAR" } } - }, - "width": 4, - "xPos": 8, - "yPos": 4 + } + }, + { + "xPos": 24, + "width": 24, + "height": 16, + "widget": { + "title": "JVM Threads State", + "pieChart": { + "chartType": "DONUT", + "dataSets": [ + { + "timeSeriesQuery": { + "outputFullDuration": true, + "prometheusQuery": "jvm_threads_state{${Cluster},${Location},${Namespace}}", + "unitOverride": "" + } + } + ], + "sliceAggregatedThreshold": 0 + } + } + }, + { + "yPos": 16, + "width": 24, + "height": 4, + "widget": { + "title": "Zookeeper", + "text": { + "content": "", + "format": "MARKDOWN", + "style": { + "backgroundColor": "#FFFFFF", + "fontSize": "FS_LARGE", + "horizontalAlignment": "H_LEFT", + "padding": "P_EXTRA_SMALL", + 
"pointerLocation": "POINTER_LOCATION_UNSPECIFIED", + "textColor": "#212121", + "verticalAlignment": "V_TOP" + } + } + } + }, + { + "xPos": 24, + "yPos": 16, + "width": 24, + "height": 4, + "widget": { + "title": "JVM", + "text": { + "content": "", + "format": "MARKDOWN", + "style": { + "backgroundColor": "#FFFFFF", + "fontSize": "FS_LARGE", + "horizontalAlignment": "H_LEFT", + "padding": "P_EXTRA_SMALL", + "pointerLocation": "POINTER_LOCATION_UNSPECIFIED", + "textColor": "#212121", + "verticalAlignment": "V_TOP" + } + } + } + }, + { + "xPos": 24, + "yPos": 28, + "width": 24, + "height": 8, + "widget": { + "title": "JVM Threads Deadlocked", + "xyChart": { + "chartOptions": { + "mode": "COLOR" + }, + "dataSets": [ + { + "breakdowns": [], + "dimensions": [], + "measures": [], + "plotType": "LINE", + "targetAxis": "Y1", + "timeSeriesQuery": { + "prometheusQuery": "jvm_threads_deadlocked{${Cluster},${Location},${Namespace}}", + "unitOverride": "" + } + } + ], + "thresholds": [ + { + "label": "", + "targetAxis": "Y1", + "value": 1 + } + ], + "yAxis": { + "label": "", + "scale": "LINEAR" + } + } + } + }, + { + "xPos": 24, + "yPos": 44, + "width": 24, + "height": 8, + "widget": { + "title": "JVM Memory Pool Allocated Bytes", + "xyChart": { + "chartOptions": { + "mode": "COLOR" + }, + "dataSets": [ + { + "breakdowns": [], + "dimensions": [], + "measures": [], + "plotType": "LINE", + "targetAxis": "Y1", + "timeSeriesQuery": { + "prometheusQuery": "jvm_memory_pool_allocated_bytes_total{${Cluster},${Location},${Namespace}}", + "unitOverride": "" + } + } + ], + "thresholds": [], + "yAxis": { + "label": "", + "scale": "LINEAR" + } + } + } + }, + { + "xPos": 24, + "yPos": 36, + "width": 24, + "height": 8, + "widget": { + "title": "JVM Garbage Collection Seconds", + "xyChart": { + "chartOptions": { + "mode": "COLOR" + }, + "dataSets": [ + { + "breakdowns": [], + "dimensions": [], + "measures": [], + "plotType": "LINE", + "targetAxis": "Y1", + "timeSeriesQuery": { + 
"prometheusQuery": "jvm_gc_collection_seconds_sum{${Cluster},${Location},${Namespace}}", + "unitOverride": "" + } + } + ], + "thresholds": [], + "yAxis": { + "label": "", + "scale": "LINEAR" + } + } + } } ] - } + }, + "labels": {} } diff --git a/dashboards/zookeeper/zookeeper-prometheus.png b/dashboards/zookeeper/zookeeper-prometheus.png index dbb03ff355..e483e0ba73 100644 Binary files a/dashboards/zookeeper/zookeeper-prometheus.png and b/dashboards/zookeeper/zookeeper-prometheus.png differ diff --git a/integrations/zookeeper/prometheus_metadata.yaml b/integrations/zookeeper/prometheus_metadata.yaml index 8458b21181..ea7d116146 100644 --- a/integrations/zookeeper/prometheus_metadata.yaml +++ b/integrations/zookeeper/prometheus_metadata.yaml @@ -57,4 +57,20 @@ platforms: prometheus_name: jvm_memory_bytes_max kind: GAUGE value_type: DOUBLE + - name: prometheus.googleapis.com/jvm_threads_state/gauge + prometheus_name: jvm_threads_state + kind: GAUGE + value_type: DOUBLE + - name: prometheus.googleapis.com/jvm_threads_deadlocked/gauge + prometheus_name: jvm_threads_deadlocked + kind: GAUGE + value_type: DOUBLE + - name: prometheus.googleapis.com/jvm_gc_collection_seconds_sum/summary:counter + prometheus_name: jvm_gc_collection_seconds_sum + kind: CUMULATIVE + value_type: DOUBLE + - name: prometheus.googleapis.com/jvm_memory_pool_allocated_bytes_total/counter + prometheus_name: jvm_memory_pool_allocated_bytes_total + kind: CUMULATIVE + value_type: DOUBLE install_documentation_url: https://cloud.google.com/stackdriver/docs/managed-prometheus/exporters/zookeeper