Postprocess after a workload has executed
This work is to take an results directory and find all the rally/Shaker/Perfkit JSONs and create the Elasticsearch JSONs that can be pushed to Elasticsearch. This is also a minor refactor of the Rally lib to refactor how we push results into elasticsearch. This creates a generic function so we can have file and/or taskid based metrics created + (sai) Fix way how we crawl for files + (sai) Exclude already postprocessed files + (sai) Fix filenaming of dumped postprocessed files + {sai) flake8 Co-Authored-By: Sai Sindhur Malleni <smalleni@redhat.com> Change-Id: I5ca8877f26e889856c9773b51ba38f24562a80af
This commit is contained in:
parent
ae06629d82
commit
423da4ff52
@ -41,6 +41,8 @@ def main():
|
|||||||
parser.add_argument('workloads', nargs='*', help='Browbeat workload(s). Takes a space separated'
|
parser.add_argument('workloads', nargs='*', help='Browbeat workload(s). Takes a space separated'
|
||||||
' list of workloads ({}) or \"all\"'.format(', '.join(_workload_opts)))
|
' list of workloads ({}) or \"all\"'.format(', '.join(_workload_opts)))
|
||||||
parser.add_argument('--debug', action='store_true', help='Enable Debug messages')
|
parser.add_argument('--debug', action='store_true', help='Enable Debug messages')
|
||||||
|
parser.add_argument('-p','--postprocess',
|
||||||
|
dest="path",help="Path to process, ie results/20170101/")
|
||||||
_cli_args = parser.parse_args()
|
_cli_args = parser.parse_args()
|
||||||
|
|
||||||
_logger = logging.getLogger('browbeat')
|
_logger = logging.getLogger('browbeat')
|
||||||
@ -67,6 +69,8 @@ def main():
|
|||||||
# Default to all workloads
|
# Default to all workloads
|
||||||
if _cli_args.workloads == []:
|
if _cli_args.workloads == []:
|
||||||
_cli_args.workloads.append('all')
|
_cli_args.workloads.append('all')
|
||||||
|
if _cli_args.path :
|
||||||
|
return tools.post_process(_cli_args)
|
||||||
|
|
||||||
if len(_cli_args.workloads) == 1 and 'all' in _cli_args.workloads:
|
if len(_cli_args.workloads) == 1 and 'all' in _cli_args.workloads:
|
||||||
_cli_args.workloads = _workload_opts
|
_cli_args.workloads = _workload_opts
|
||||||
|
114
lib/Rally.py
114
lib/Rally.py
@ -23,6 +23,7 @@ import shutil
|
|||||||
import time
|
import time
|
||||||
import Tools
|
import Tools
|
||||||
import WorkloadBase
|
import WorkloadBase
|
||||||
|
import json
|
||||||
|
|
||||||
|
|
||||||
class Rally(WorkloadBase.WorkloadBase):
|
class Rally(WorkloadBase.WorkloadBase):
|
||||||
@ -33,7 +34,8 @@ class Rally(WorkloadBase.WorkloadBase):
|
|||||||
self.tools = Tools.Tools(self.config)
|
self.tools = Tools.Tools(self.config)
|
||||||
self.connmon = Connmon.Connmon(self.config)
|
self.connmon = Connmon.Connmon(self.config)
|
||||||
self.grafana = Grafana.Grafana(self.config)
|
self.grafana = Grafana.Grafana(self.config)
|
||||||
self.elastic = Elastic.Elastic(self.config, self.__class__.__name__.lower())
|
self.elastic = Elastic.Elastic(
|
||||||
|
self.config, self.__class__.__name__.lower())
|
||||||
self.error_count = 0
|
self.error_count = 0
|
||||||
self.pass_count = 0
|
self.pass_count = 0
|
||||||
self.test_count = 0
|
self.test_count = 0
|
||||||
@ -125,16 +127,44 @@ class Rally(WorkloadBase.WorkloadBase):
|
|||||||
result['rally_metadata'] = meta
|
result['rally_metadata'] = meta
|
||||||
return result
|
return result
|
||||||
|
|
||||||
def json_result(self, task_id, scenario_name, run, test_name, result_dir):
|
def file_to_json(self, filename, push_to_es=False):
|
||||||
|
self.logger.info("Loading rally JSON file {} JSON".format(filename))
|
||||||
|
rally_json = self.elastic.load_json_file(filename)
|
||||||
|
errors, results = self.json_parse(rally_json)
|
||||||
|
for error in errors:
|
||||||
|
error_result = self.elastic.combine_metadata(error)
|
||||||
|
with open("{}/{}-error_index-es.json".format(os.path.dirname(filename),
|
||||||
|
os.path.basename(filename)),
|
||||||
|
'w+') as error_file:
|
||||||
|
json.dump(error_result, error_file)
|
||||||
|
for result in results:
|
||||||
|
result_doc = self.elastic.combine_metadata(result)
|
||||||
|
with open("{}/{}-result_index-es.json".format(os.path.dirname(filename),
|
||||||
|
os.path.splitext(
|
||||||
|
os.path.basename(filename))[0]),
|
||||||
|
'w+') as result_file:
|
||||||
|
json.dump(result_doc, result_file)
|
||||||
|
return errors, results
|
||||||
|
|
||||||
|
def json_parse(self, json_doc, metadata={}):
|
||||||
|
"""Function to extract data out of a json document
|
||||||
|
|
||||||
|
Args:
|
||||||
|
json_doc (json): json document to parse
|
||||||
|
metadata (dict): dict containing run specific metadata, ie rally UUID.
|
||||||
|
|
||||||
|
Returns:
|
||||||
|
errors (list) : errors contained within the json_doc
|
||||||
|
results (list) : results contained within the json_doc
|
||||||
|
"""
|
||||||
rally_data = {}
|
rally_data = {}
|
||||||
failure = False
|
errors = []
|
||||||
self.logger.info("Loading Task_ID {} JSON".format(task_id))
|
results = []
|
||||||
rally_json = self.elastic.load_json(self.gen_scenario_json(task_id))
|
if len(json_doc) < 1:
|
||||||
es_ts = datetime.datetime.utcnow()
|
self.logger.error("Issue with JSON document")
|
||||||
if len(rally_json) < 1:
|
|
||||||
self.logger.error("Issue with Rally Results")
|
|
||||||
return False
|
return False
|
||||||
for metrics in rally_json[0]['result']:
|
es_ts = datetime.datetime.utcnow()
|
||||||
|
for metrics in json_doc[0]['result']:
|
||||||
for workload in metrics:
|
for workload in metrics:
|
||||||
if type(metrics[workload]) is dict:
|
if type(metrics[workload]) is dict:
|
||||||
for value in metrics[workload]:
|
for value in metrics[workload]:
|
||||||
@ -146,47 +176,56 @@ class Rally(WorkloadBase.WorkloadBase):
|
|||||||
iteration = 1
|
iteration = 1
|
||||||
workload_name = value
|
workload_name = value
|
||||||
if value.find('(') is not -1:
|
if value.find('(') is not -1:
|
||||||
iteration = re.findall('\d+', value)
|
iteration = re.findall('\d+', value)[0]
|
||||||
workload_name = value.split('(')[0]
|
workload_name = value.split('(')[0]
|
||||||
error = {'action': workload_name.strip(),
|
error = {'action': workload_name.strip(),
|
||||||
'browbeat_rerun': run,
|
|
||||||
'iteration': iteration,
|
'iteration': iteration,
|
||||||
'error_type': metrics['error'][0],
|
'error_type': metrics['error'][0],
|
||||||
'error_msg': metrics['error'][1],
|
'error_msg': metrics['error'][1],
|
||||||
'result': task_id,
|
|
||||||
'timestamp': str(es_ts).replace(" ", "T"),
|
'timestamp': str(es_ts).replace(" ", "T"),
|
||||||
'rally_setup': rally_json[0]['key'],
|
'rally_setup': json_doc[0]['key']
|
||||||
'scenario': scenario_name,
|
|
||||||
}
|
}
|
||||||
error_result = self.elastic.combine_metadata(error)
|
if len(metadata) > 0:
|
||||||
index_status = self.elastic.index_result(error_result, test_name, result_dir,
|
error.update(metadata)
|
||||||
workload, 'error')
|
errors.append(error)
|
||||||
if index_status is False:
|
|
||||||
failure = True
|
|
||||||
for workload in rally_data:
|
for workload in rally_data:
|
||||||
if not type(rally_data[workload]) is dict:
|
if not type(rally_data[workload]) is dict:
|
||||||
iteration = 1
|
iteration = 1
|
||||||
workload_name = workload
|
workload_name = workload
|
||||||
if workload.find('(') is not -1:
|
if workload.find('(') is not -1:
|
||||||
iteration = re.findall('\d+', workload)
|
iteration = re.findall('\d+', workload)[0]
|
||||||
workload_name = workload.split('(')[0]
|
workload_name = workload.split('(')[0]
|
||||||
rally_stats = {'result': task_id,
|
rally_stats = {'action': workload_name.strip(),
|
||||||
'action': workload_name.strip(),
|
|
||||||
'browbeat_rerun': run,
|
|
||||||
'iteration': iteration,
|
'iteration': iteration,
|
||||||
'timestamp': str(es_ts).replace(" ", "T"),
|
'timestamp': str(es_ts).replace(" ", "T"),
|
||||||
'grafana_url': [self.grafana.grafana_urls()],
|
'grafana_url': [self.grafana.grafana_urls()],
|
||||||
'scenario': scenario_name,
|
'rally_setup': json_doc[0]['key'],
|
||||||
'rally_setup': rally_json[0]['key'],
|
|
||||||
'raw': rally_data[workload]}
|
'raw': rally_data[workload]}
|
||||||
result = self.elastic.combine_metadata(rally_stats)
|
if len(metadata) > 0:
|
||||||
index_status = self.elastic.index_result(result, test_name, result_dir, workload)
|
rally_stats.update(metadata)
|
||||||
if index_status is False:
|
results.append(rally_stats)
|
||||||
failure = True
|
return errors, results
|
||||||
if failure:
|
|
||||||
return False
|
def json_result(self, task_id, scenario_name, run, test_name, result_dir):
|
||||||
else:
|
success = True
|
||||||
return True
|
self.logger.info("Loading Task_ID {} JSON".format(task_id))
|
||||||
|
rally_json = self.elastic.load_json(self.gen_scenario_json(task_id))
|
||||||
|
errors, results = self.json_parse(rally_json, {'scenario': scenario_name,
|
||||||
|
'browbeat_rerun': run,
|
||||||
|
'result': task_id})
|
||||||
|
for error in errors:
|
||||||
|
error_result = self.elastic.combine_metadata(error)
|
||||||
|
status = self.elastic.index_result(error_result, test_name, result_dir,
|
||||||
|
'rally', 'error')
|
||||||
|
if not status:
|
||||||
|
success = False
|
||||||
|
for result in results:
|
||||||
|
result = self.elastic.combine_metadata(result)
|
||||||
|
status = self.elastic.index_result(
|
||||||
|
result, test_name, result_dir, 'rally')
|
||||||
|
if not status:
|
||||||
|
success = False
|
||||||
|
return success
|
||||||
|
|
||||||
def start_workloads(self):
|
def start_workloads(self):
|
||||||
"""Iterates through all rally scenarios in browbeat yaml config file"""
|
"""Iterates through all rally scenarios in browbeat yaml config file"""
|
||||||
@ -239,7 +278,8 @@ class Rally(WorkloadBase.WorkloadBase):
|
|||||||
del scenario['concurrency']
|
del scenario['concurrency']
|
||||||
else:
|
else:
|
||||||
concurrencies = def_concurrencies
|
concurrencies = def_concurrencies
|
||||||
concurrency_count_dict = collections.Counter(concurrencies)
|
concurrency_count_dict = collections.Counter(
|
||||||
|
concurrencies)
|
||||||
if 'times' not in scenario:
|
if 'times' not in scenario:
|
||||||
scenario['times'] = def_times
|
scenario['times'] = def_times
|
||||||
|
|
||||||
@ -260,7 +300,8 @@ class Rally(WorkloadBase.WorkloadBase):
|
|||||||
self.logger.debug("Duplicate concurrency {} found,"
|
self.logger.debug("Duplicate concurrency {} found,"
|
||||||
" setting test name"
|
" setting test name"
|
||||||
" to {}".format(concurrency, test_name))
|
" to {}".format(concurrency, test_name))
|
||||||
concurrency_count_dict[concurrency] -= 1
|
concurrency_count_dict[
|
||||||
|
concurrency] -= 1
|
||||||
|
|
||||||
if not result_dir:
|
if not result_dir:
|
||||||
self.logger.error(
|
self.logger.error(
|
||||||
@ -311,7 +352,8 @@ class Rally(WorkloadBase.WorkloadBase):
|
|||||||
index_status = self.json_result(
|
index_status = self.json_result(
|
||||||
task_id, scenario_name, run, test_name, result_dir)
|
task_id, scenario_name, run, test_name, result_dir)
|
||||||
self.get_time_dict(to_time, from_time,
|
self.get_time_dict(to_time, from_time,
|
||||||
benchmark['name'], new_test_name,
|
benchmark[
|
||||||
|
'name'], new_test_name,
|
||||||
workload, "pass", index_status)
|
workload, "pass", index_status)
|
||||||
else:
|
else:
|
||||||
self.get_time_dict(to_time, from_time, benchmark[
|
self.get_time_dict(to_time, from_time, benchmark[
|
||||||
|
79
lib/Tools.py
79
lib/Tools.py
@ -17,9 +17,11 @@ import logging
|
|||||||
import os
|
import os
|
||||||
import subprocess
|
import subprocess
|
||||||
import yaml
|
import yaml
|
||||||
|
import re
|
||||||
from pykwalify import core as pykwalify_core
|
from pykwalify import core as pykwalify_core
|
||||||
from pykwalify import errors as pykwalify_errors
|
from pykwalify import errors as pykwalify_errors
|
||||||
|
|
||||||
|
|
||||||
class Tools(object):
|
class Tools(object):
|
||||||
|
|
||||||
def __init__(self, config=None):
|
def __init__(self, config=None):
|
||||||
@ -59,32 +61,38 @@ class Tools(object):
|
|||||||
|
|
||||||
# Create directory for results
|
# Create directory for results
|
||||||
def create_results_dir(self, results_dir, timestamp, service, scenario):
|
def create_results_dir(self, results_dir, timestamp, service, scenario):
|
||||||
the_directory = "{}/{}/{}/{}".format(results_dir, timestamp, service, scenario)
|
the_directory = "{}/{}/{}/{}".format(results_dir,
|
||||||
|
timestamp, service, scenario)
|
||||||
if not os.path.isdir(the_directory):
|
if not os.path.isdir(the_directory):
|
||||||
try:
|
try:
|
||||||
os.makedirs(the_directory)
|
os.makedirs(the_directory)
|
||||||
except OSError as err:
|
except OSError as err:
|
||||||
self.logger.error("Error creating the results directory: {}".format(err))
|
self.logger.error(
|
||||||
|
"Error creating the results directory: {}".format(err))
|
||||||
return False
|
return False
|
||||||
return the_directory
|
return the_directory
|
||||||
|
|
||||||
def _load_config(self, path):
|
def _load_config(self, path, validate=True):
|
||||||
try:
|
try:
|
||||||
stream = open(path, 'r')
|
stream = open(path, 'r')
|
||||||
except IOError:
|
except IOError:
|
||||||
self.logger.error("Configuration file {} passed is missing".format(path))
|
self.logger.error(
|
||||||
|
"Configuration file {} passed is missing".format(path))
|
||||||
exit(1)
|
exit(1)
|
||||||
config = yaml.load(stream)
|
config = yaml.load(stream)
|
||||||
stream.close()
|
stream.close()
|
||||||
self.config = config
|
self.config = config
|
||||||
self.validate_yaml()
|
if validate:
|
||||||
|
self.validate_yaml()
|
||||||
return config
|
return config
|
||||||
|
|
||||||
def validate_yaml(self):
|
def validate_yaml(self):
|
||||||
self.logger.info("Validating the configuration file passed by the user")
|
self.logger.info(
|
||||||
|
"Validating the configuration file passed by the user")
|
||||||
stream = open("lib/validate.yaml", 'r')
|
stream = open("lib/validate.yaml", 'r')
|
||||||
schema = yaml.load(stream)
|
schema = yaml.load(stream)
|
||||||
check = pykwalify_core.Core(source_data=self.config, schema_data=schema)
|
check = pykwalify_core.Core(
|
||||||
|
source_data=self.config, schema_data=schema)
|
||||||
try:
|
try:
|
||||||
check.validate(raise_exception=True)
|
check.validate(raise_exception=True)
|
||||||
self.logger.info("Validation successful")
|
self.logger.info("Validation successful")
|
||||||
@ -110,12 +118,14 @@ class Tools(object):
|
|||||||
meta = self.config['elasticsearch']['metadata_files']
|
meta = self.config['elasticsearch']['metadata_files']
|
||||||
for _meta in meta:
|
for _meta in meta:
|
||||||
if not os.path.isfile(_meta['file']):
|
if not os.path.isfile(_meta['file']):
|
||||||
self.logger.error("Metadata file {} is not present".format(_meta['file']))
|
self.logger.error(
|
||||||
|
"Metadata file {} is not present".format(_meta['file']))
|
||||||
return False
|
return False
|
||||||
return True
|
return True
|
||||||
|
|
||||||
def gather_metadata(self):
|
def gather_metadata(self):
|
||||||
os.putenv("ANSIBLE_SSH_ARGS"," -F {}".format(self.config['ansible']['ssh_config']))
|
os.putenv("ANSIBLE_SSH_ARGS",
|
||||||
|
" -F {}".format(self.config['ansible']['ssh_config']))
|
||||||
ansible_cmd = \
|
ansible_cmd = \
|
||||||
'ansible-playbook -i {} {}' \
|
'ansible-playbook -i {} {}' \
|
||||||
.format(self.config['ansible']['hosts'], self.config['ansible']['metadata'])
|
.format(self.config['ansible']['hosts'], self.config['ansible']['metadata'])
|
||||||
@ -126,3 +136,54 @@ class Tools(object):
|
|||||||
else:
|
else:
|
||||||
self.logger.info("Metadata about cloud has been gathered")
|
self.logger.info("Metadata about cloud has been gathered")
|
||||||
return True
|
return True
|
||||||
|
|
||||||
|
def post_process(self, cli):
|
||||||
|
workloads = {}
|
||||||
|
workloads['shaker'] = re.compile("shaker")
|
||||||
|
workloads['perfkit'] = re.compile("perfkit")
|
||||||
|
workloads['rally'] = re.compile("(?!perfkit)|(?!shaker)")
|
||||||
|
""" Iterate through dir structure """
|
||||||
|
results = {}
|
||||||
|
if os.path.isdir(cli.path):
|
||||||
|
for dirname, dirnames, files in os.walk(cli.path):
|
||||||
|
self.logger.info("Inspecting : %s" % dirname)
|
||||||
|
results[dirname] = files
|
||||||
|
else:
|
||||||
|
self.logger.error("Path does not exist")
|
||||||
|
return False
|
||||||
|
|
||||||
|
""" Capture per-workload results """
|
||||||
|
workload_results = {}
|
||||||
|
json = re.compile("\.json")
|
||||||
|
if len(results) > 0:
|
||||||
|
for path in results:
|
||||||
|
for regex in workloads:
|
||||||
|
if re.findall(workloads[regex], path):
|
||||||
|
if regex not in workload_results:
|
||||||
|
workload_results[regex] = []
|
||||||
|
for file in results[path]:
|
||||||
|
if (re.findall(json, file) and
|
||||||
|
'result_index-es' not in file):
|
||||||
|
workload_results[regex].append(
|
||||||
|
"{}/{}".format(path, file))
|
||||||
|
else:
|
||||||
|
self.logger.error("Results are empty")
|
||||||
|
return False
|
||||||
|
|
||||||
|
""" Iterate through each workload result, generate ES JSON """
|
||||||
|
if len(workload_results) > 0:
|
||||||
|
for workload in workload_results:
|
||||||
|
if workload is "rally":
|
||||||
|
rally = Rally.Rally(self.config)
|
||||||
|
for file in workload_results[workload]:
|
||||||
|
errors, results = rally.file_to_json(file)
|
||||||
|
return True
|
||||||
|
if cli.es:
|
||||||
|
# Stub for when we want to push to ES.
|
||||||
|
continue
|
||||||
|
if workload is "shaker":
|
||||||
|
# Stub for Shaker.
|
||||||
|
continue
|
||||||
|
if workload is "perfkit":
|
||||||
|
# Stub for PerfKit.
|
||||||
|
continue
|
||||||
|
Loading…
Reference in New Issue
Block a user