Merge "Add statsd metrics for ansible runs"
This commit is contained in:
commit
93d62f8d71
@ -1,4 +1,7 @@
|
|||||||
iptables_extra_allowed_hosts:
|
iptables_extra_allowed_hosts:
|
||||||
|
- hostname: bridge.openstack.org
|
||||||
|
port: 8125
|
||||||
|
protocol: udp
|
||||||
- hostname: git.openstack.org
|
- hostname: git.openstack.org
|
||||||
port: 8125
|
port: 8125
|
||||||
protocol: udp
|
protocol: udp
|
||||||
|
@ -13,7 +13,7 @@
|
|||||||
cron:
|
cron:
|
||||||
name: run_all.sh
|
name: run_all.sh
|
||||||
state: present
|
state: present
|
||||||
job: 'flock -n /var/run/ansible/run_all.lock bash /opt/system-config/run_all.sh >> /var/log/ansible/run_all_cron.log 2>&1'
|
job: 'flock -n /var/run/ansible/run_all.lock bash /opt/system-config/run_all.sh -c >> /var/log/ansible/run_all_cron.log 2>&1'
|
||||||
minute: "{{ update_cron_interval.minute }}"
|
minute: "{{ update_cron_interval.minute }}"
|
||||||
hour: "{{ update_cron_interval.hour }}"
|
hour: "{{ update_cron_interval.hour }}"
|
||||||
day: "{{ update_cron_interval.day }}"
|
day: "{{ update_cron_interval.day }}"
|
||||||
|
54
run_all.sh
54
run_all.sh
@ -22,6 +22,41 @@ set -e
|
|||||||
SYSTEM_CONFIG=/opt/system-config
|
SYSTEM_CONFIG=/opt/system-config
|
||||||
ANSIBLE_PLAYBOOKS=$SYSTEM_CONFIG/playbooks
|
ANSIBLE_PLAYBOOKS=$SYSTEM_CONFIG/playbooks
|
||||||
|
|
||||||
|
# We only send stats if running under cron
|
||||||
|
UNDER_CRON=0
|
||||||
|
|
||||||
|
while getopts ":c" arg; do
|
||||||
|
case $arg in
|
||||||
|
c)
|
||||||
|
UNDER_CRON=1
|
||||||
|
;;
|
||||||
|
esac
|
||||||
|
done
|
||||||
|
|
||||||
|
GLOBAL_START_TIME=$(date '+%s')
|
||||||
|
|
||||||
|
# Send a timer stat to statsd
|
||||||
|
# send_timer metric [start_time]
|
||||||
|
# * uses timer metric bridge.ansible.run_all.<$1>
|
||||||
|
# * time will be taken from last call of start_timer, or $2 if set
|
||||||
|
function send_timer {
|
||||||
|
# Only send stats under cron conditions
|
||||||
|
if [[ ${UNDER_CRON} != 1 ]]; then
|
||||||
|
return
|
||||||
|
fi
|
||||||
|
|
||||||
|
local current=$(date '+%s')
|
||||||
|
local name=$1
|
||||||
|
local start=${2-$_START_TIME}
|
||||||
|
local elapsed_ms=$(( (current - start) * 1000 ))
|
||||||
|
|
||||||
|
echo "bridge.ansible.run_all.${name}:${elapsed_ms}|ms" | nc -w 1 -u graphite.openstack.org 8125
|
||||||
|
}
|
||||||
|
# See send_timer
|
||||||
|
function start_timer {
|
||||||
|
_START_TIME=$(date '+%s')
|
||||||
|
}
|
||||||
|
|
||||||
echo "--- begin run @ $(date -Is) ---"
|
echo "--- begin run @ $(date -Is) ---"
|
||||||
|
|
||||||
# It's possible for connectivity to a server or manifest application to break
|
# It's possible for connectivity to a server or manifest application to break
|
||||||
@ -33,24 +68,43 @@ set +e
|
|||||||
# stuck if they are oomkilled
|
# stuck if they are oomkilled
|
||||||
|
|
||||||
# Clone system-config and install modules and roles
|
# Clone system-config and install modules and roles
|
||||||
|
start_timer
|
||||||
timeout -k 2m 120m ansible-playbook ${ANSIBLE_PLAYBOOKS}/update-system-config.yaml
|
timeout -k 2m 120m ansible-playbook ${ANSIBLE_PLAYBOOKS}/update-system-config.yaml
|
||||||
|
send_timer update_system_config
|
||||||
|
|
||||||
# Update the code on bridge
|
# Update the code on bridge
|
||||||
|
start_timer
|
||||||
timeout -k 2m 120m ansible-playbook ${ANSIBLE_PLAYBOOKS}/bridge.yaml
|
timeout -k 2m 120m ansible-playbook ${ANSIBLE_PLAYBOOKS}/bridge.yaml
|
||||||
|
send_timer bridge
|
||||||
|
|
||||||
# Run the base playbook everywhere
|
# Run the base playbook everywhere
|
||||||
|
start_timer
|
||||||
timeout -k 2m 120m ansible-playbook -f 50 ${ANSIBLE_PLAYBOOKS}/base.yaml
|
timeout -k 2m 120m ansible-playbook -f 50 ${ANSIBLE_PLAYBOOKS}/base.yaml
|
||||||
|
send_timer base
|
||||||
|
|
||||||
# Update the puppet version
|
# Update the puppet version
|
||||||
|
start_timer
|
||||||
timeout -k 2m 120m ansible-playbook -f 50 ${ANSIBLE_PLAYBOOKS}/update_puppet_version.yaml
|
timeout -k 2m 120m ansible-playbook -f 50 ${ANSIBLE_PLAYBOOKS}/update_puppet_version.yaml
|
||||||
|
send_timer update_puppet_version
|
||||||
|
|
||||||
# Run the git/gerrit/zuul sequence, since it's important that they all work together
|
# Run the git/gerrit/zuul sequence, since it's important that they all work together
|
||||||
|
start_timer
|
||||||
timeout -k 2m 120m ansible-playbook -f 50 ${ANSIBLE_PLAYBOOKS}/remote_puppet_git.yaml
|
timeout -k 2m 120m ansible-playbook -f 50 ${ANSIBLE_PLAYBOOKS}/remote_puppet_git.yaml
|
||||||
|
send_timer git
|
||||||
|
|
||||||
# Run AFS changes separately so we can make sure to only do one at a time
|
# Run AFS changes separately so we can make sure to only do one at a time
|
||||||
# (turns out quorum is nice to have)
|
# (turns out quorum is nice to have)
|
||||||
|
start_timer
|
||||||
timeout -k 2m 120m ansible-playbook -f 1 ${ANSIBLE_PLAYBOOKS}/remote_puppet_afs.yaml
|
timeout -k 2m 120m ansible-playbook -f 1 ${ANSIBLE_PLAYBOOKS}/remote_puppet_afs.yaml
|
||||||
|
send_timer afs
|
||||||
|
|
||||||
# Run everything else. We do not care if the other things worked
|
# Run everything else. We do not care if the other things worked
|
||||||
|
start_timer
|
||||||
timeout -k 2m 120m ansible-playbook -f 50 ${ANSIBLE_PLAYBOOKS}/remote_puppet_else.yaml
|
timeout -k 2m 120m ansible-playbook -f 50 ${ANSIBLE_PLAYBOOKS}/remote_puppet_else.yaml
|
||||||
|
send_timer else
|
||||||
|
|
||||||
|
# Send the combined time for everything
|
||||||
|
send_timer total $GLOBAL_START_TIME
|
||||||
|
|
||||||
echo "--- end run @ $(date -Is) ---"
|
echo "--- end run @ $(date -Is) ---"
|
||||||
echo
|
echo
|
||||||
|
Loading…
x
Reference in New Issue
Block a user