X-Git-Url: https://git.arvados.org/arvados.git/blobdiff_plain/0a3d7a02236cbec448203a1b2218b5e0630d1c00..ad00c515d3a34a8247a08be5a332470f8563086c:/doc/admin/metrics.html.textile.liquid?ds=sidebyside diff --git a/doc/admin/metrics.html.textile.liquid b/doc/admin/metrics.html.textile.liquid index 107431267e..1d6b87da62 100644 --- a/doc/admin/metrics.html.textile.liquid +++ b/doc/admin/metrics.html.textile.liquid @@ -10,72 +10,47 @@ Copyright (C) The Arvados Authors. All rights reserved. SPDX-License-Identifier: CC-BY-SA-3.0 {% endcomment %} -Metrics endpoints are found at @/status.json@ on many Arvados services. The purpose of metrics are to provide statistics about the operation of a service, suitable for diagnosing how well a service is performing under load. - -Metrics endpoints must be configured with a "management token":management-token.html . - -h2. Keepstore - -h3. Root - -table(table table-bordered table-condensed). -|_. Attribute|_. Type|_. Description| -|Volumes| array of "volumeStatusEnt":#volumeStatusEnt || -|BufferPool| "PoolStatus":#PoolStatus || -|PullQueue| "WorkQueueStatus":#WorkQueueStatus || -|TrashQueue| "WorkQueueStatus":#WorkQueueStatus || -|RequestsCurrent| int || -|RequestsMax| int || -|Version| string || - -h3(#volumeStatusEnt). volumeStatusEnt - -table(table table-bordered table-condensed). -|_. Attribute|_. Type|_. Description| -|Label| string|| -|Status| "VolumeStatus":#VolumeStatus || -|VolumeStats| "ioStats":#ioStats || - -h3(#VolumeStatus). VolumeStatus - -table(table table-bordered table-condensed). -|_. Attribute|_. Type|_. Description| -|MountPoint| string|| -|DeviceNum| uint64|| -|BytesFree| uint64|| -|BytesUsed| uint64|| - -h3(#ioStats). ioStats - -table(table table-bordered table-condensed). -|_. Attribute|_. Type|_. Description| -|Errors| uint64|| -|Ops| uint64|| -|CompareOps| uint64|| -|GetOps| uint64|| -|PutOps| uint64|| -|TouchOps| uint64|| -|InBytes| uint64|| -|OutBytes| uint64|| - -h3(#PoolStatus). 
PoolStatus - -table(table table-bordered table-condensed). -|_. Attribute|_. Type|_. Description| -|BytesAllocatedCumulative| uint64|| -|BuffersMax| int|| -|BuffersInUse| int|| - -h3(#WorkQueueStatus). WorkQueueStatus - -table(table table-bordered table-condensed). -|_. Attribute|_. Type|_. Description| -|InProgress| int|| -|Queued| int|| +Some Arvados services publish Prometheus/OpenMetrics-compatible metrics at @/metrics@. Metrics can help you understand how components perform under load, find performance bottlenecks, and detect and diagnose problems. + +To access metrics endpoints, services must be configured with a "management token":management-token.html. When accessing a metrics endpoint, prefix the management token with @"Bearer "@ and supply it in the @Authorization@ request header. + +
curl -sfH "Authorization: Bearer your_management_token_goes_here" "https://0.0.0.0:25107/metrics"
+
+ +The plain text export format includes "help" messages with a description of each reported metric. + +When configuring Prometheus, use a @bearer_token@ or @bearer_token_file@ option to authenticate requests. + +
scrape_configs:
+  - job_name: keepstore
+    bearer_token: your_management_token_goes_here
+    static_configs:
+    - targets:
+      - "keep0.ClusterID.example.com:25107"
+
+ +table(table table-bordered table-condensed table-hover). +|_. Component|_. Metrics endpoint| +|arvados-api-server|| +|arvados-controller|✓| +|arvados-dispatch-cloud|✓| +|arvados-git-httpd|| +|arvados-node-manager|| +|arvados-ws|✓| +|composer|| +|keepproxy|| +|keepstore|✓| +|keep-balance|✓| +|keep-web|✓| +|workbench1|| +|workbench2|| h2. Node manager -The node manager status end point provides a snapshot of internal status at the time of the most recent wishlist update. +The node manager does not export Prometheus-style metrics, but its @/status.json@ endpoint provides a snapshot of internal status at the time of the most recent wishlist update. + +
curl -sfH "Authorization: Bearer your_management_token_goes_here" "http://0.0.0.0:8989/status.json"
+
table(table table-bordered table-condensed). |_. Attribute|_. Type|_. Description| @@ -89,3 +64,28 @@ table(table table-bordered table-condensed). |nodes_wish|int|Number of nodes in the current wishlist| |node_quota|int|Current node count ceiling due to cloud quota limits| |config_max_nodes|int|Configured max node count| + +h3. Example + +
+{
+  "actor_exceptions": 0,
+  "idle_times": {
+    "compute1": 0,
+    "compute3": 0,
+    "compute2": 0,
+    "compute4": 0
+  },
+  "create_node_errors": 0,
+  "destroy_node_errors": 0,
+  "nodes_idle": 0,
+  "config_max_nodes": 8,
+  "list_nodes_errors": 0,
+  "node_quota": 8,
+  "Version": "1.1.4.20180719160944",
+  "nodes_wish": 0,
+  "nodes_unpaired": 0,
+  "nodes_busy": 4,
+  "boot_failures": 0
+}
+