project-config/grafana/nodepool-ovh.yaml
David Moreau-Simard a281b06c27
Update Nodepool graphite metric names
Following the update to Zuul v3 some things changed:
- nodes.delete became nodes.deleting
- nodes.used became nodes.in-use but nodes.used is still relevant
  as it's the status between 'in-use' and 'deleting'
- Add a panel for displaying failed nodes

Change-Id: I240d082115bd9078e45984d8fcff212a4e40e842
Depends-On: I6a89752d74ed7424267c3af3937ad01fb4bb8f86
2017-10-02 10:31:52 -04:00

189 lines
7.3 KiB
YAML

dashboard:
title: 'Nodepool: OVH'
rows:
- title: Description
height: 100px
panels:
- title: Description
content: |
**This dashboard is managed by [Grafyaml](http://docs.openstack.org/infra/system-config/grafyaml.html).**
If you would like to make changes to this dashboard, please see the grafana directory in [project-config](https://git.openstack.org/cgit/openstack-infra/project-config/tree/grafana/nodepool-ovh.yaml).
type: text
- title: Nodes
showTitle: true
height: 150px
panels:
- title: Building
span: 3
sparkline:
full: true
show: true
targets:
- target: sumSeries(stats.gauges.nodepool.provider.ovh-*.nodes.building)
type: singlestat
valueName: current
- title: Ready
span: 3
sparkline:
full: true
show: true
targets:
- target: sumSeries(stats.gauges.nodepool.provider.ovh-*.nodes.ready)
type: singlestat
valueName: current
- title: In Use
span: 3
sparkline:
full: true
show: true
targets:
- target: sumSeries(stats.gauges.nodepool.provider.ovh-*.nodes.in-use)
type: singlestat
valueName: current
- title: Deleting
span: 3
sparkline:
full: true
show: true
targets:
- target: sumSeries(stats.gauges.nodepool.provider.ovh-*.nodes.deleting)
type: singlestat
valueName: current
- title: API Operations
showTitle: true
height: 250px
panels:
- title: Create Server
type: graph
span: 4
leftYAxisLabel: "time"
y_formats:
- s
- none
targets:
- target: alias(scale(stats.timers.nodepool.task.ovh-bhs1.ComputePostServers.mean, '0.001'), 'BHS1')
- target: alias(scale(stats.timers.nodepool.task.ovh-gra1.ComputePostServers.mean, '0.001'), 'GRA1')
- title: Get Server
type: graph
span: 4
leftYAxisLabel: "time"
y_formats:
- s
- none
targets:
- target: alias(scale(stats.timers.nodepool.task.ovh-bhs1.ComputeGetServersDetail.mean, '0.001'), 'BHS1')
- target: alias(scale(stats.timers.nodepool.task.ovh-gra1.ComputeGetServersDetail.mean, '0.001'), 'GRA1')
- title: Delete Server
type: graph
span: 4
leftYAxisLabel: "time"
y_formats:
- s
- none
targets:
- target: alias(scale(stats.timers.nodepool.task.ovh-bhs1.ComputeDeleteServers.mean, '0.001'), 'BHS1')
- target: alias(scale(stats.timers.nodepool.task.ovh-gra1.ComputeDeleteServers.mean, '0.001'), 'GRA1')
- title: List Servers
type: graph
span: 4
leftYAxisLabel: "time"
y_formats:
- s
- none
targets:
- target: alias(scale(stats.timers.nodepool.task.ovh-bhs1.ComputeGetServers.mean, '0.001'), 'BHS1')
- target: alias(scale(stats.timers.nodepool.task.ovh-gra1.ComputeGetServers.mean, '0.001'), 'GRA1')
- title: Node Launches
showTitle: true
height: 250px
panels:
- title: Ready Node Launch Attempts
type: graph
span: 4
nullPointMode: null as zero
leftYAxisLabel: "events / min"
targets:
- target: alias(smartSummarize(stats_counts.nodepool.launch.provider.ovh-bhs1.ready, '1m'), 'BHS1')
- target: alias(smartSummarize(stats_counts.nodepool.launch.provider.ovh-gra1.ready, '1m'), 'GRA1')
- title: Error Node Launch Attempts
type: graph
span: 4
nullPointMode: null as zero
leftYAxisLabel: "events / min"
targets:
- target: alias(smartSummarize(sumSeries(stats_counts.nodepool.launch.provider.ovh-bhs1.error.*), '1m'), 'BHS1')
- target: alias(smartSummarize(sumSeries(stats_counts.nodepool.launch.provider.ovh-gra1.error.*), '1m'), 'GRA1')
- title: Time to Ready
type: graph
span: 4
leftYAxisLabel: "time"
y_formats:
- s
- none
targets:
- target: alias(scale(stats.timers.nodepool.launch.provider.ovh-bhs1.ready.mean, '0.001'), 'BHS1')
- target: alias(scale(stats.timers.nodepool.launch.provider.ovh-gra1.ready.mean, '0.001'), 'GRA1')
- title: Test Nodes (BHS1)
type: graph
span: 4
stack: true
tooltip:
value_type: individual
leftYAxisLabel: "nodes"
targets:
- target: alias(stats.gauges.nodepool.provider.ovh-bhs1.nodes.building, 'Building')
- target: alias(stats.gauges.nodepool.provider.ovh-bhs1.nodes.ready, 'Available')
- target: alias(stats.gauges.nodepool.provider.ovh-bhs1.nodes.in-use, 'In Use')
- target: alias(stats.gauges.nodepool.provider.ovh-bhs1.nodes.used, 'Used')
- target: alias(stats.gauges.nodepool.provider.ovh-bhs1.nodes.deleting, 'Deleting')
- target: alias(stats.gauges.nodepool.provider.ovh-bhs1.max_servers, 'Max')
seriesOverrides:
- alias: Max
stack: False
- title: Test Nodes (GRA1)
type: graph
span: 4
stack: true
tooltip:
value_type: individual
leftYAxisLabel: "nodes"
targets:
- target: alias(stats.gauges.nodepool.provider.ovh-gra1.nodes.building, 'Building')
- target: alias(stats.gauges.nodepool.provider.ovh-gra1.nodes.ready, 'Available')
- target: alias(stats.gauges.nodepool.provider.ovh-gra1.nodes.in-use, 'In Use')
- target: alias(stats.gauges.nodepool.provider.ovh-gra1.nodes.used, 'Used')
- target: alias(stats.gauges.nodepool.provider.ovh-gra1.nodes.deleting, 'Deleting')
- target: alias(stats.gauges.nodepool.provider.ovh-gra1.max_servers, 'Max')
seriesOverrides:
- alias: Max
stack: False
- title: Images
showTitle: true
height: 250px
panels:
- title: Image Uploads
type: graph
span: 4
leftYAxisLabel: "time"
y_formats:
- s
- none
targets:
- target: alias(scale(averageSeries(stats.timers.nodepool.image_update.*.ovh-bhs1.mean), '0.001'), 'BHS1')
- target: alias(scale(averageSeries(stats.timers.nodepool.image_update.*.ovh-gra1.mean), '0.001'), 'GRA1')
- title: Job Runtimes
showTitle: true
height: 250px
panels:
- title: gate-tempest-dsvm-neutron-full
type: graph
span: 6
leftYAxisLabel: "time"
y_formats:
- s
- none
targets:
- target: alias(scale(stats.timers.nodepool.job.gate-tempest-dsvm-neutron-full-ubuntu-xenial.master.ubuntu-xenial.ovh-bhs1.runtime.mean, '0.001'), 'BHS1')
- target: alias(scale(stats.timers.nodepool.job.gate-tempest-dsvm-neutron-full-ubuntu-xenial.master.ubuntu-xenial.ovh-gra1.runtime.mean, '0.001'), 'GRA1')