CFME-collectd/dashboard fixes.
+ Correctly collect on evm:dbsync:replicate and appliance_console.rb + Fix Ansible 2.0 deprecation + Improve visualization of IOPs/Throughput per CFME process component of dashboard + Improve visualization of CFME Per Process CPU Utilization: 100% now represents 100% CPU of a single core rather than all CPU resources. Change-Id: I35b5419c32c03e8f8cf1b1c7667ab9b1597997d8
This commit is contained in:
parent
8aeb443df9
commit
121525e4e6
@ -185,8 +185,8 @@ LoadPlugin uptime
|
|||||||
# Appliance processes
|
# Appliance processes
|
||||||
ProcessMatch "evm_server.rb" ".*evm_server\.rb$"
|
ProcessMatch "evm_server.rb" ".*evm_server\.rb$"
|
||||||
ProcessMatch "evm_watchdog.rb" "/bin/evm_watchdog.rb"
|
ProcessMatch "evm_watchdog.rb" "/bin/evm_watchdog.rb"
|
||||||
Process "evm:dbsync:replicate"
|
ProcessMatch "evm:dbsync:replicate" ".*evm:dbsync:replicate$"
|
||||||
Process "appliance_console.rb"
|
ProcessMatch "appliance_console.rb" ".*appliance_console.rb$"
|
||||||
|
|
||||||
# Workers
|
# Workers
|
||||||
ProcessMatch "MiqEventHandler" ".*MiqEventHandler.*"
|
ProcessMatch "MiqEventHandler" ".*MiqEventHandler.*"
|
||||||
|
@ -185,8 +185,8 @@ LoadPlugin uptime
|
|||||||
# Appliance processes
|
# Appliance processes
|
||||||
ProcessMatch "evm_server.rb" ".*evm_server\.rb$"
|
ProcessMatch "evm_server.rb" ".*evm_server\.rb$"
|
||||||
ProcessMatch "evm_watchdog.rb" "/bin/evm_watchdog.rb"
|
ProcessMatch "evm_watchdog.rb" "/bin/evm_watchdog.rb"
|
||||||
Process "evm:dbsync:replicate"
|
ProcessMatch "evm:dbsync:replicate" ".*evm:dbsync:replicate$"
|
||||||
Process "appliance_console.rb"
|
ProcessMatch "appliance_console.rb" ".*appliance_console.rb$"
|
||||||
|
|
||||||
# Workers
|
# Workers
|
||||||
ProcessMatch "MiqEventHandler" ".*MiqEventHandler.*"
|
ProcessMatch "MiqEventHandler" ".*MiqEventHandler.*"
|
||||||
|
@ -67,8 +67,8 @@ LoadPlugin uptime
|
|||||||
# Appliance processes
|
# Appliance processes
|
||||||
ProcessMatch "evm_server.rb" ".*evm_server\.rb$"
|
ProcessMatch "evm_server.rb" ".*evm_server\.rb$"
|
||||||
ProcessMatch "evm_watchdog.rb" "/bin/evm_watchdog.rb"
|
ProcessMatch "evm_watchdog.rb" "/bin/evm_watchdog.rb"
|
||||||
Process "evm:dbsync:replicate"
|
ProcessMatch "evm:dbsync:replicate" ".*evm:dbsync:replicate$"
|
||||||
Process "appliance_console.rb"
|
ProcessMatch "appliance_console.rb" ".*appliance_console.rb$"
|
||||||
|
|
||||||
# Workers
|
# Workers
|
||||||
ProcessMatch "MiqEventHandler" ".*MiqEventHandler.*"
|
ProcessMatch "MiqEventHandler" ".*MiqEventHandler.*"
|
||||||
|
@ -6,7 +6,7 @@
|
|||||||
- name: Remove existing dashboards
|
- name: Remove existing dashboards
|
||||||
command: "curl -X DELETE -H 'Content-Type: application/json' http://{{grafana_username}}:{{grafana_password}}@{{grafana_host}}:{{grafana_port}}/api/dashboards/db/{{item.process_list_name|lower}}-general-system-performance"
|
command: "curl -X DELETE -H 'Content-Type: application/json' http://{{grafana_username}}:{{grafana_password}}@{{grafana_host}}:{{grafana_port}}/api/dashboards/db/{{item.process_list_name|lower}}-general-system-performance"
|
||||||
when: overwrite_existing
|
when: overwrite_existing
|
||||||
with_items: dashboards
|
with_items: "{{dashboards}}"
|
||||||
|
|
||||||
- name: Ensure {{role_path}}/files directory exists
|
- name: Ensure {{role_path}}/files directory exists
|
||||||
file: path={{role_path}}/files state=directory
|
file: path={{role_path}}/files state=directory
|
||||||
@ -15,12 +15,12 @@
|
|||||||
template:
|
template:
|
||||||
src: "{{item.template_name}}_general_system_performance.json.j2"
|
src: "{{item.template_name}}_general_system_performance.json.j2"
|
||||||
dest: "{{role_path}}/files/{{item.process_list_name}}_general_system_performance.json"
|
dest: "{{role_path}}/files/{{item.process_list_name}}_general_system_performance.json"
|
||||||
with_items: dashboards
|
with_items: "{{dashboards}}"
|
||||||
|
|
||||||
- name: Upload dashboards to grafana
|
- name: Upload dashboards to grafana
|
||||||
command: "curl -X POST -H 'Content-Type: application/json' -d @{{role_path}}/files/{{item.process_list_name}}_general_system_performance.json http://{{grafana_username}}:{{grafana_password}}@{{grafana_host}}:{{grafana_port}}/api/dashboards/db"
|
command: "curl -X POST -H 'Content-Type: application/json' -d @{{role_path}}/files/{{item.process_list_name}}_general_system_performance.json http://{{grafana_username}}:{{grafana_password}}@{{grafana_host}}:{{grafana_port}}/api/dashboards/db"
|
||||||
with_items: dashboards
|
with_items: "{{dashboards}}"
|
||||||
|
|
||||||
- name: Remove leftover json file(s)
|
- name: Remove leftover json file(s)
|
||||||
file: path={{role_path}}/files/{{item.process_list_name}}_general_system_performance.json state=absent
|
file: path={{role_path}}/files/{{item.process_list_name}}_general_system_performance.json state=absent
|
||||||
with_items: dashboards
|
with_items: "{{dashboards}}"
|
||||||
|
@ -1890,7 +1890,7 @@
|
|||||||
"lines": true,
|
"lines": true,
|
||||||
"linewidth": 2,
|
"linewidth": 2,
|
||||||
"links": [],
|
"links": [],
|
||||||
"nullPointMode": "connected",
|
"nullPointMode": "{{metrics.nullPointMode}}",
|
||||||
"percentage": false,
|
"percentage": false,
|
||||||
"pointradius": 5,
|
"pointradius": 5,
|
||||||
"points": false,
|
"points": false,
|
||||||
@ -1901,20 +1901,12 @@
|
|||||||
"steppedLine": false,
|
"steppedLine": false,
|
||||||
"targets": [
|
"targets": [
|
||||||
{% if vars.update({'temp_count': 0}) %} {% endif %}
|
{% if vars.update({'temp_count': 0}) %} {% endif %}
|
||||||
{% if metrics.name|match('Process CPU') %}
|
|
||||||
{
|
|
||||||
"hide": true,
|
|
||||||
"refId": "{{vars.temp_count|to_grafana_refid}}",
|
|
||||||
"target": "alias(sumSeries(offset(scale($Cloud.$Node.cpu-*.cpu-idle, 0), 1)), 'cores')"
|
|
||||||
},
|
|
||||||
{% if vars.update({'temp_count': (vars.temp_count + 1)}) %} {% endif %}
|
|
||||||
{% endif %}
|
|
||||||
{% for process in panel.processes %}
|
{% for process in panel.processes %}
|
||||||
{% for metric in metrics.metrics %}
|
{% for metric in metrics.metrics %}
|
||||||
{
|
{
|
||||||
"refId": "{{vars.temp_count|to_grafana_refid}}",
|
"refId": "{{vars.temp_count|to_grafana_refid}}",
|
||||||
{% if metrics.name|match('Process CPU') %}
|
{% if metrics.name|match('Process CPU') %}
|
||||||
"target": "alias(divideSeries(scale($Cloud.$Node.processes-{{process|replace('.', '_')|replace(':', '_')}}{{metric.query}}, 0.0001), #A), '{{process}} {{metric.name}}')"
|
"target": "alias(scale($Cloud.$Node.processes-{{process|replace('.', '_')|replace(':', '_')}}{{metric.query}}, 0.0001), '{{process}} {{metric.name}}')"
|
||||||
{% else %}
|
{% else %}
|
||||||
"target": "alias($Cloud.$Node.processes-{{process|replace('.', '_')|replace(':', '_')}}{{metric.query}}, '{{process}} {{metric.name}}')"
|
"target": "alias($Cloud.$Node.processes-{{process|replace('.', '_')|replace(':', '_')}}{{metric.query}}, '{{process}} {{metric.name}}')"
|
||||||
{% endif %}
|
{% endif %}
|
||||||
|
@ -1890,7 +1890,7 @@
|
|||||||
"lines": true,
|
"lines": true,
|
||||||
"linewidth": 2,
|
"linewidth": 2,
|
||||||
"links": [],
|
"links": [],
|
||||||
"nullPointMode": "connected",
|
"nullPointMode": "{{metrics.nullPointMode}}",
|
||||||
"percentage": false,
|
"percentage": false,
|
||||||
"pointradius": 5,
|
"pointradius": 5,
|
||||||
"points": false,
|
"points": false,
|
||||||
@ -1901,20 +1901,12 @@
|
|||||||
"steppedLine": false,
|
"steppedLine": false,
|
||||||
"targets": [
|
"targets": [
|
||||||
{% if vars.update({'temp_count': 0}) %} {% endif %}
|
{% if vars.update({'temp_count': 0}) %} {% endif %}
|
||||||
{% if metrics.name|match('Process CPU') %}
|
|
||||||
{
|
|
||||||
"hide": true,
|
|
||||||
"refId": "{{vars.temp_count|to_grafana_refid}}",
|
|
||||||
"target": "alias(sumSeries(offset(scale($Cloud.$Node.cpu-*.cpu-idle, 0), 1)), 'cores')"
|
|
||||||
},
|
|
||||||
{% if vars.update({'temp_count': (vars.temp_count + 1)}) %} {% endif %}
|
|
||||||
{% endif %}
|
|
||||||
{% for process in panel.processes %}
|
{% for process in panel.processes %}
|
||||||
{% for metric in metrics.metrics %}
|
{% for metric in metrics.metrics %}
|
||||||
{
|
{
|
||||||
"refId": "{{vars.temp_count|to_grafana_refid}}",
|
"refId": "{{vars.temp_count|to_grafana_refid}}",
|
||||||
{% if metrics.name|match('Process CPU') %}
|
{% if metrics.name|match('Process CPU') %}
|
||||||
"target": "alias(divideSeries(scale($Cloud.$Node.processes-{{process|replace('.', '_')|replace(':', '_')}}{{metric.query}}, 0.0001), #A), '{{process}} {{metric.name}}')"
|
"target": "alias(scale($Cloud.$Node.processes-{{process|replace('.', '_')|replace(':', '_')}}{{metric.query}}, 0.0001), '{{process}} {{metric.name}}')"
|
||||||
{% else %}
|
{% else %}
|
||||||
"target": "alias($Cloud.$Node.processes-{{process|replace('.', '_')|replace(':', '_')}}{{metric.query}}, '{{process}} {{metric.name}}')"
|
"target": "alias($Cloud.$Node.processes-{{process|replace('.', '_')|replace(':', '_')}}{{metric.query}}, '{{process}} {{metric.name}}')"
|
||||||
{% endif %}
|
{% endif %}
|
||||||
|
@ -11,6 +11,7 @@ per_process_metrics:
|
|||||||
query: ".ps_count.processes"
|
query: ".ps_count.processes"
|
||||||
- name: "Threads"
|
- name: "Threads"
|
||||||
query: ".ps_count.threads"
|
query: ".ps_count.threads"
|
||||||
|
nullPointMode: "connected"
|
||||||
- name: "Process CPU"
|
- name: "Process CPU"
|
||||||
y1units: "percent"
|
y1units: "percent"
|
||||||
metrics:
|
metrics:
|
||||||
@ -18,6 +19,7 @@ per_process_metrics:
|
|||||||
query: ".ps_cputime.syst"
|
query: ".ps_cputime.syst"
|
||||||
- name: "User"
|
- name: "User"
|
||||||
query: ".ps_cputime.user"
|
query: ".ps_cputime.user"
|
||||||
|
nullPointMode: "connected"
|
||||||
- name: "Process Memory"
|
- name: "Process Memory"
|
||||||
y1units: "bits"
|
y1units: "bits"
|
||||||
metrics:
|
metrics:
|
||||||
@ -25,6 +27,7 @@ per_process_metrics:
|
|||||||
query: ".ps_rss"
|
query: ".ps_rss"
|
||||||
- name: "Virtual"
|
- name: "Virtual"
|
||||||
query: ".ps_vm"
|
query: ".ps_vm"
|
||||||
|
nullPointMode: "connected"
|
||||||
- name: "Process Page Faults"
|
- name: "Process Page Faults"
|
||||||
y1units: "short"
|
y1units: "short"
|
||||||
metrics:
|
metrics:
|
||||||
@ -32,6 +35,7 @@ per_process_metrics:
|
|||||||
query: ".ps_pagefaults.majflt"
|
query: ".ps_pagefaults.majflt"
|
||||||
- name: "Minflt"
|
- name: "Minflt"
|
||||||
query: ".ps_pagefaults.minflt"
|
query: ".ps_pagefaults.minflt"
|
||||||
|
nullPointMode: "connected"
|
||||||
- name: "Process IOPs(Estimated via SYSCALLS)"
|
- name: "Process IOPs(Estimated via SYSCALLS)"
|
||||||
y1units: "iops"
|
y1units: "iops"
|
||||||
metrics:
|
metrics:
|
||||||
@ -39,6 +43,7 @@ per_process_metrics:
|
|||||||
query: ".ps_disk_ops.read"
|
query: ".ps_disk_ops.read"
|
||||||
- name: "Write"
|
- name: "Write"
|
||||||
query: ".ps_disk_ops.write"
|
query: ".ps_disk_ops.write"
|
||||||
|
nullPointMode: "null"
|
||||||
- name: "Process IO Throughput(Estimated via SYSCALLS)"
|
- name: "Process IO Throughput(Estimated via SYSCALLS)"
|
||||||
y1units: "bytes"
|
y1units: "bytes"
|
||||||
metrics:
|
metrics:
|
||||||
@ -46,6 +51,7 @@ per_process_metrics:
|
|||||||
query: ".ps_disk_octets.read"
|
query: ".ps_disk_octets.read"
|
||||||
- name: "Write"
|
- name: "Write"
|
||||||
query: ".ps_disk_octets.write"
|
query: ".ps_disk_octets.write"
|
||||||
|
nullPointMode: "null"
|
||||||
|
|
||||||
per_process_panels:
|
per_process_panels:
|
||||||
Baremetal:
|
Baremetal:
|
||||||
|
Loading…
x
Reference in New Issue
Block a user