diff options
author | Ilya Mashchenko <ilya@netdata.cloud> | 2020-01-31 10:38:44 +0300 |
---|---|---|
committer | GitHub <noreply@github.com> | 2020-01-31 10:38:44 +0300 |
commit | 29d9b5e51603792ee27ef5a21f1de0ba8e130158 (patch) | |
tree | f976f869aa8343e471fe8a03205aebd3c0dd3845 | |
parent | a6976f49df8dbdb6521f7cbf9e7983312c652a30 (diff) |
installer: include go.d.plugin version v0.15.0 (#7882)
* /web/gui/dashboard_info.js: add cockroachdb info
* /web/gui/dashboard_info.js: lgtm fix
* /health/health.d/: add cockroachdb.conf
-rw-r--r-- | health/Makefile.am | 1 | ||||
-rw-r--r-- | health/health.d/cockroachdb.conf | 91 | ||||
-rw-r--r-- | packaging/go.d.checksums | 32 | ||||
-rw-r--r-- | packaging/go.d.version | 2 | ||||
-rw-r--r-- | web/gui/dashboard_info.js | 184 |
5 files changed, 292 insertions, 18 deletions
diff --git a/health/Makefile.am b/health/Makefile.am index ccd36bf1b7..853ed0d708 100644 --- a/health/Makefile.am +++ b/health/Makefile.am @@ -37,6 +37,7 @@ dist_healthconfig_DATA = \ health.d/ceph.conf \ health.d/cgroups.conf \ health.d/cpu.conf \ + health.d/cockroachdb.conf \ health.d/couchdb.conf \ health.d/disks.conf \ health.d/dnsmasq_dhcp.conf \ diff --git a/health/health.d/cockroachdb.conf b/health/health.d/cockroachdb.conf new file mode 100644 index 0000000000..8ab2c9d0f7 --- /dev/null +++ b/health/health.d/cockroachdb.conf @@ -0,0 +1,91 @@ + +# Availability + +template: cockroachdb_last_collected_secs + on: cockroachdb.live_nodes + calc: $now - $last_collected_t + units: seconds ago + every: 10s + warn: $this > (($status >= $WARNING) ? ($update_every) : ( 5 * $update_every)) + crit: $this > (($status == $CRITICAL) ? ($update_every) : (60 * $update_every)) + delay: down 5m multiplier 1.5 max 1h + info: number of seconds since the last successful data collection + to: dba + +# Capacity + +template: cockroachdb_used_storage_capacity + on: cockroachdb.storage_used_capacity_percentage + calc: $capacity_used_percent + units: % + every: 10s + warn: $this > (($status >= $WARNING) ? (80) : (85)) + crit: $this > (($status == $CRITICAL) ? (85) : (95)) + delay: down 15m multiplier 1.5 max 1h + info: entire disk usage percentage + to: dba + +template: cockroachdb_used_usable_storage_capacity + on: cockroachdb.storage_used_capacity_percentage + calc: $capacity_usable_used_percent + units: % + every: 10s + warn: $this > (($status >= $WARNING) ? (80) : (85)) + crit: $this > (($status == $CRITICAL) ? 
(85) : (95)) + delay: down 15m multiplier 1.5 max 1h + info: usable space usage percentage + to: dba + +# Replication + +template: cockroachdb_unavailable_ranges + on: cockroachdb.ranges_replication_problem + calc: $ranges_unavailable + units: num + every: 10s + warn: $this > 0 + delay: down 15m multiplier 1.5 max 1h + info: number of ranges with fewer live replicas than the replication target + to: dba + +template: cockroachdb_replicas_leaders_not_leaseholders + on: cockroachdb.replicas_leaders + calc: $replicas_leaders_not_leaseholders + units: num + every: 10s + warn: $this > 0 + delay: down 15m multiplier 1.5 max 1h + info: number of replicas that are Raft leaders whose range lease is held by another store + to: dba + +# FD + +template: cockroachdb_open_file_descriptors_limit + on: cockroachdb.process_file_descriptors + calc: $sys_fd_open/$sys_fd_softlimit * 100 + units: % + every: 10s + warn: $this > 80 + delay: down 15m multiplier 1.5 max 1h + info: open file descriptors usage percentage + to: dba + +# SQL + +template: cockroachdb_sql_active_connections + on: cockroachdb.sql_connections + calc: $sql_conns + units: active connections + every: 10s + info: number of active SQL connections + to: dba + +template: cockroachdb_sql_executed_statements_total_last_5m + on: cockroachdb.sql_statements_total + lookup: sum -5m absolute of sql_query_count + units: statements + every: 10s + warn: $this == 0 AND $cockroachdb_sql_active_connections != 0 + delay: down 15m up 30s multiplier 1.5 max 1h + info: number of executed SQL statements in the last 5 minutes + to: dba diff --git a/packaging/go.d.checksums b/packaging/go.d.checksums index c0e85c460e..798558abbf 100644 --- a/packaging/go.d.checksums +++ b/packaging/go.d.checksums @@ -1,16 +1,16 @@ -f038852ab4c6fb1623384685a8d2b2d0ab85474d91303d8e6b3a670d0625f104 *config.tar.gz -2087d74c4f18cd1d5f49f5e000e0cf2f63464930e9e1164e0b903268e7e85a9f *go.d.plugin-v0.14.1.darwin-386.tar.gz 
-acd275d58c8ba448572b50b04b3faeefcd35be985a1155192ac77d0e383c5854 *go.d.plugin-v0.14.1.darwin-amd64.tar.gz -b8da98b28dc5a048e9bb7d187c07df69bf631738ec540847b2c194e422f21ecc *go.d.plugin-v0.14.1.freebsd-386.tar.gz -021ae15d077f3688704db91650542dfab284b5d7d3f21ff83d3ba398c7cc77af *go.d.plugin-v0.14.1.freebsd-amd64.tar.gz -ea69f36e745d92b98e8a1bea118433954e1d6aea5af8923413857ca61da02b8a *go.d.plugin-v0.14.1.freebsd-arm.tar.gz -6173c2c632ee01b911d8436c64e88df0dfff6360ff9f9662c560615557c78101 *go.d.plugin-v0.14.1.linux-386.tar.gz -641d943355b31677c4cb6d445817a17317c4cb89cb173e5ecfa8567ebcef96ef *go.d.plugin-v0.14.1.linux-amd64.tar.gz -2ec678203c5728444a8550ac5e378c74c434e5e0db6ae71dd5acc28b8ab45018 *go.d.plugin-v0.14.1.linux-arm.tar.gz -b1070000c9b853d50cce0e644b8e4602ed0c6bcdf203a25678a6f9f6554dd4e1 *go.d.plugin-v0.14.1.linux-arm64.tar.gz -c6e7574680a2281fdce764861197bb61dde5e0e6c0d24ab57bab5deb321e218d *go.d.plugin-v0.14.1.linux-mips.tar.gz -b7bdd268e485d67a60670f432fd7dca9122abbbf25d4be4706406f4e9c0efaab *go.d.plugin-v0.14.1.linux-mips64.tar.gz -dc865ffeb2cf07d89a38927bbce812b2407b0c2a84299c207c497dd77c3f9be9 *go.d.plugin-v0.14.1.linux-mips64le.tar.gz -6b8d55742dfe9f4116edd2cbca670245a3e81344ffa50fb75885b841f85b7699 *go.d.plugin-v0.14.1.linux-mipsle.tar.gz -830a6bb2028476568870d4a01725586c1799862a4eb0eb7a3bce9e2e617fb688 *go.d.plugin-v0.14.1.linux-ppc64.tar.gz -985ee3f5e24cc6cba71723e7b6acd06e49f48280007f33174b557fa8dda6daef *go.d.plugin-v0.14.1.linux-ppc64le.tar.gz +eac6cdc2f38986ba8605030b6ac41304b5f03e880fc9fea943ed034fc8f7490a *config.tar.gz +7021f071689e4efa879d557f4a76c369e3a7b95c093913ba3c5429087e093258 *go.d.plugin-v0.15.0.darwin-386.tar.gz +ac16155b37fd51c5d333e490b4e5b85e3388b3b42ae9bb5bc828f78aa1cbd58a *go.d.plugin-v0.15.0.darwin-amd64.tar.gz +5d34e399ee75db0fce858a34038b3d645c8b5c80b26c346f6908117a738899ff *go.d.plugin-v0.15.0.freebsd-386.tar.gz +d2ff775c11dcf8c90ab92e8d229a74980bb498513cc7411962cdc8056cb22eef *go.d.plugin-v0.15.0.freebsd-amd64.tar.gz 
+3563424c41ca047786a9ef80ac25704d27d53e7b64b8252ce30d3b54b3d1638f *go.d.plugin-v0.15.0.freebsd-arm.tar.gz +8e8e52bde2da6ce98fa902bad164152c53632fc7b1e1c9f689a89c0e5a87548f *go.d.plugin-v0.15.0.linux-386.tar.gz +292546c3338b372441816be12e13f7fe6951281c2f03cff947d9bfb0cb39aeb2 *go.d.plugin-v0.15.0.linux-amd64.tar.gz +ab5fb4d2f277255de31ca9330aacb67ebab2f10c398dc96f207eefefae1960ce *go.d.plugin-v0.15.0.linux-arm.tar.gz +93ebd48c2b781fb42a26e21759885772d08e3ee2eea46b12e10681ff6c914de6 *go.d.plugin-v0.15.0.linux-arm64.tar.gz +c83e8c758b116c13184314158ed5e7516fa4467a50e43b7d30bd466938e1a0c7 *go.d.plugin-v0.15.0.linux-mips.tar.gz +7a036e6e74ac13b82a6baedf61208a6eae6dc1b57da50ad47b2fc5a376ef680a *go.d.plugin-v0.15.0.linux-mips64.tar.gz +8f5a92bc4feac4ae44c0881e0de4490643fccc2d7e0867de437e0d08fc858256 *go.d.plugin-v0.15.0.linux-mips64le.tar.gz +5a87a29f6a723d7bdc063e767c20c377cb8383edca96f36a3ed45d3434b7b157 *go.d.plugin-v0.15.0.linux-mipsle.tar.gz +b67f5ed415c8f2109c916f655c60d2d61cb520623065bee770941bf8f40af1cc *go.d.plugin-v0.15.0.linux-ppc64.tar.gz +69ab1728f6017e3e83db5971a6e57dabdb5b9190ae1d817ee9b010bc0a2995a0 *go.d.plugin-v0.15.0.linux-ppc64le.tar.gz diff --git a/packaging/go.d.version b/packaging/go.d.version index 64a3b7907b..86dd09abce 100644 --- a/packaging/go.d.version +++ b/packaging/go.d.version @@ -1 +1 @@ -v0.14.1 +v0.15.0 diff --git a/web/gui/dashboard_info.js b/web/gui/dashboard_info.js index 7032074b7e..b86841653c 100644 --- a/web/gui/dashboard_info.js +++ b/web/gui/dashboard_info.js @@ -534,6 +534,12 @@ netdataDashboard.menu = { title: 'Squid log', icon: '<i class="fas fa-file-alt"></i>', info: undefined + }, + + 'cockroachdb': { + title: 'CockroachDB', + icon: '<i class="fas fa-database"></i>', + info: 'Performance and health statistics for various <code>CockroachDB</code> components.' } }; @@ -2828,6 +2834,182 @@ netdataDashboard.context = { 'squidlog.mime_type_requests': { info: 'The content type of the object as seen in the HTTP reply header. 
Please note that ICP exchanges usually don\'t have any content type.' - } + }, + + // ------------------------------------------------------------------------ + // CockroachDB + + 'cockroachdb.process_cpu_time_combined_percentage': { + info: 'Current combined cpu utilization, calculated as <code>(user+system)/num of logical cpus</code>.' + }, + + 'cockroachdb.host_disk_bandwidth': { + info: 'Summary disk bandwidth statistics across all system host disks.' + }, + + 'cockroachdb.host_disk_operations': { + info: 'Summary disk operations statistics across all system host disks.' + }, + + 'cockroachdb.host_disk_iops_in_progress': { + info: 'Summary disk iops in progress statistics across all system host disks.' + }, + + 'cockroachdb.host_network_bandwidth': { + info: 'Summary network bandwidth statistics across all system host network interfaces.' + }, + + 'cockroachdb.host_network_packets': { + info: 'Summary network packets statistics across all system host network interfaces.' + }, + + 'cockroachdb.live_nodes': { + info: 'Will be <code>0</code> if this node is not itself live.' + }, + + 'cockroachdb.total_storage_capacity': { + info: 'Entire disk capacity. It includes non-CR data, CR data, and empty space.' + }, + + 'cockroachdb.storage_capacity_usability': { + info: '<code>usable</code> is sum of empty space and CR data, <code>unusable</code> is space used by non-CR data.' + }, + + 'cockroachdb.storage_usable_capacity': { + info: 'Breakdown of <code>usable</code> space.' + }, + + 'cockroachdb.storage_used_capacity_percentage': { + info: '<code>total</code> is % of <b>total</b> space used, <code>usable</code> is % of <b>usable</b> space used.' + }, + + 'cockroachdb.sql_bandwidth': { + info: 'The total amount of SQL client network traffic.' + }, + + 'cockroachdb.sql_errors': { + info: '<code>statement</code> is statements resulting in a planning or runtime error, ' + + '<code>transaction</code> is SQL transactions abort errors.' 
+ }, + + 'cockroachdb.sql_started_ddl_statements': { + info: 'The amount of <b>started</b> DDL (Data Definition Language) statements. ' + + 'This type means database schema changes. ' + + 'It includes <code>CREATE</code>, <code>ALTER</code>, <code>DROP</code>, <code>RENAME</code>, <code>TRUNCATE</code> and <code>COMMENT</code> statements.' + }, + + 'cockroachdb.sql_executed_ddl_statements': { + info: 'The amount of <b>executed</b> DDL (Data Definition Language) statements. ' + + 'This type means database schema changes. ' + + 'It includes <code>CREATE</code>, <code>ALTER</code>, <code>DROP</code>, <code>RENAME</code>, <code>TRUNCATE</code> and <code>COMMENT</code> statements.' + }, + + 'cockroachdb.sql_started_dml_statements': { + info: 'The amount of <b>started</b> DML (Data Manipulation Language) statements.' + }, + + 'cockroachdb.sql_executed_dml_statements': { + info: 'The amount of <b>executed</b> DML (Data Manipulation Language) statements.' + }, + + 'cockroachdb.sql_started_tcl_statements': { + info: 'The amount of <b>started</b> TCL (Transaction Control Language) statements.' + }, + + 'cockroachdb.sql_executed_tcl_statements': { + info: 'The amount of <b>executed</b> TCL (Transaction Control Language) statements.' + }, + + 'cockroachdb.live_bytes': { + info: 'The amount of live data used by both applications and the CockroachDB system.' 
+ }, + + 'cockroachdb.kv_transactions': { + info: 'KV transactions breakdown:<br>' + + '<ul>' + + ' <li><code>committed</code> committed KV transactions (including 1PC).</li>' + + ' <li><code>fast-path_committed</code> KV transaction on-phase commit attempts.</li>' + + ' <li><code>aborted</code> aborted KV transactions.</li>' + + ' </ul>' + }, + + 'cockroachdb.kv_transaction_restarts': { + info: 'KV transactions restarts breakdown:<br>' + + '<ul>' + + ' <li><code>write too old</code> restarts due to a concurrent writer committing first.</li>' + + ' <li><code>write too old (multiple)</code> restarts due to multiple concurrent writers committing first.</li>' + + ' <li><code>forwarded timestamp (iso=serializable)</code> restarts due to a forwarded commit timestamp and isolation=SERIALIZABLE".</li>' + + ' <li><code>possible replay</code> restarts due to possible replays of command batches at the storage layer.</li>' + + ' <li><code>async consensus failure</code> restarts due to async consensus writes that failed to leave intents.</li>' + + ' <li><code>read within uncertainty interval</code> restarts due to reading a new value within the uncertainty interval.</li>' + + ' <li><code>aborted</code> restarts due to an abort by a concurrent transaction (usually due to deadlock).</li>' + + ' <li><code>push failure</code> restarts due to a transaction push failure.</li>' + + ' <li><code>unknown</code> restarts due to a unknown reasons.</li>' + + ' </ul>' + }, + + 'cockroachdb.ranges': { + info: 'CockroachDB stores all user data (tables, indexes, etc.) and almost all system data in a giant sorted map of key-value pairs. ' + + 'This keyspace is divided into "ranges", contiguous chunks of the keyspace, so that every key can always be found in a single range.' 
+ }, + + 'cockroachdb.ranges_replication_problem': { + info: 'Ranges with not optimal number of replicas:<br>' + + '<ul>' + + ' <li><code>unavailable</code> ranges with fewer live replicas than needed for quorum.</li>' + + ' <li><code>under replicated</code> ranges with fewer live replicas than the replication target.</li>' + + ' <li><code>over replicated</code> ranges with more live replicas than the replication target.</li>' + + ' </ul>' + }, + + 'cockroachdb.replicas': { + info: 'CockroachDB replicates each range (3 times by default) and stores each replica on a different node.' + }, + + 'cockroachdb.replicas_leaders': { + info: 'For each range, one of the replicas is the <code>leader</code> for write requests, <code>not leaseholders</code> is the number of Raft leaders whose range lease is held by another store.' + }, + + 'cockroachdb.replicas_leaseholders': { + info: 'For each range, one of the replicas holds the "range lease". This replica, referred to as the <code>leaseholder</code>, is the one that receives and coordinates all read and write requests for the range.' 
+ }, + + 'cockroachdb.queue_processing_failures': { + info: 'Failed replicas breakdown by queue:<br>' + + '<ul>' + + ' <li><code>gc</code> replicas which failed processing in the GC queue.</li>' + + ' <li><code>replica gc</code> replicas which failed processing in the replica GC queue.</li>' + + ' <li><code>replication</code> replicas which failed processing in the replicate queue.</li>' + + ' <li><code>split</code> replicas which failed processing in the split queue.</li>' + + ' <li><code>consistency</code> replicas which failed processing in the consistency checker queue.</li>' + + ' <li><code>raft log</code> replicas which failed processing in the Raft log queue.</li>' + + ' <li><code>raft snapshot</code> replicas which failed processing in the Raft repair queue.</li>' + + ' <li><code>time series maintenance</code> replicas which failed processing in the time series maintenance queue.</li>' + + ' </ul>' + }, + + 'cockroachdb.rebalancing_queries': { + info: 'Number of kv-level requests received per second by the store, averaged over a large time period as used in rebalancing decisions.' + }, + + 'cockroachdb.rebalancing_writes': { + info: 'Number of keys written (i.e. applied by raft) per second to the store, averaged over a large time period as used in rebalancing decisions.' + }, + + 'cockroachdb.slow_requests': { + info: 'Requests that have been stuck for a long time.' + }, + + 'cockroachdb.timeseries_samples': { + info: 'The amount of metric samples written to disk.' + }, + + 'cockroachdb.timeseries_write_errors': { + info: 'The amount of errors encountered while attempting to write metrics to disk.' + }, + + 'cockroachdb.timeseries_write_bytes': { + info: 'Size of metric samples written to disk.' + }, }; |