Files
impala/tests/util/plugin_runner.py
ishaan 3bed0be1df Refactor the performance framework and change its execution strategy.
This patch introduces new abstractions and changes the way queries are run via the
workload runner. A new class 'Workload' is introduced, which represents the notion of a
workload in the performance framework (i.e., a set of query names mapped to query
strings).

The new workflow is:
 - run-workload acts as a driver. It accepts user parameters for which queries to
   run and their execution strategy. It generates workload objects and passes them to the
   workload-runner.
 - The workload runner takes a workload, its execution parameters and generates a set of
   test vectors over which the workload is run iteratively.
 - A workload is executed by initializing a QueryExecutor for each query being run in a
   test vector. The workload executor is then responsible for execution and gathering
   results.
 - The execution details of every query being executed are stored and returned to the
   driver (run-workload).

Change-Id: Ia16360140d65e6733e534e823bc5d5614622ab5f
Reviewed-on: http://gerrit.ent.cloudera.com:8080/3616
Reviewed-by: Taras Bobrovytsky <tbobrovytsky@cloudera.com>
Tested-by: jenkins
2014-07-25 18:17:11 -07:00

105 lines
3.9 KiB
Python

#!/usr/bin/env python
# Copyright (c) 2012 Cloudera, Inc. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import imp
import logging
import os
import pkgutil
import sys
# Directory that is scanned for plugin modules. IMPALA_HOME must be set in the
# environment; otherwise this lookup raises KeyError when the module is imported.
PLUGIN_DIR = os.path.join(os.environ['IMPALA_HOME'], 'tests', 'benchmark', 'plugins')
# Set up logging for this module. Note that basicConfig() configures the root logger,
# so it affects the whole process (and does nothing if the root logger already has
# handlers).
logging.basicConfig(level=logging.INFO, format='%(filename)s: %(message)s')
LOG = logging.getLogger('plugin_runner')
# With the logger at INFO, messages sent through LOG.debug() are suppressed.
LOG.setLevel(level=logging.INFO)
class PluginRunner(object):
    ''' Loads user specified plugins, if found, and initializes them.

    Imports every module found in PLUGIN_DIR (tests/benchmark/plugins) and searches each
    one for the requested plugin names. A plugin name is the name of the class that the
    user has used to implement a plugin. Every class that is found is instantiated with
    its scope and added to self._plugins. If a requested plugin is not found in any
    module, a RuntimeError is raised.

    Plugins are requested with strings of the form <plugin_name>[:<scope>]; the scope
    defaults to 'query' when it is omitted.
    '''

    def __init__(self, plugin_infos):
        '''Import the available plugin modules and load the requested plugins.

        plugin_infos: iterable of '<plugin_name>[:<scope>]' strings.
        Raises ValueError for a malformed entry and RuntimeError for a plugin that is
        not defined in any of the modules.
        '''
        self._available_modules = self._get_plugin_modules()
        self._get_plugins_from_modules(plugin_infos)

    @property
    def plugins(self):
        '''The list of plugin instances that were loaded.'''
        return self._plugins

    def __getstate__(self):
        '''Return the instance state for pickling, without the module iterator.'''
        # _available_modules is a generator, which cannot be pickled.
        state = self.__dict__.copy()
        state.pop('_available_modules', None)
        return state

    def _get_plugin_modules(self):
        '''Lazily import and yield every module found in PLUGIN_DIR.'''
        for _, mod_name, _ in pkgutil.iter_modules(path=[PLUGIN_DIR]):
            module_path = "tests.benchmark.plugins.%s" % mod_name
            # A non-empty fromlist makes __import__ return the leaf module instead of
            # the top-level package.
            yield __import__(module_path, fromlist=[mod_name])

    def _get_plugins_from_modules(self, plugin_infos):
        '''Look for user specified plugins in the available modules.

        Populates self._plugins with one instance per (module, plugin) match, ordered
        by module and then by the order of plugin_infos.
        Raises RuntimeError if a requested plugin is not defined in any module.
        '''
        # Parse the requests once, up front, so that malformed or unknown names are
        # reported even when PLUGIN_DIR contains no modules at all.
        requested = [self._get_plugin_info(info) for info in plugin_infos or ()]
        self._plugins = []
        plugins_found = []
        for module in self._available_modules:
            for plugin_name, scope in requested:
                if hasattr(module, plugin_name):
                    plugin_class = getattr(module, plugin_name)
                    self._plugins.append(plugin_class(scope=scope.lower()))
                    plugins_found.append(plugin_name)
        LOG.debug("Plugins found: %s", ', '.join(plugins_found))
        # The plugin(s) that could not be loaded are the requested names that never
        # matched an attribute of any module (kept in request order, de-duplicated).
        found = set(plugins_found)
        plugins_not_found = []
        for plugin_name, _ in requested:
            if plugin_name not in found and plugin_name not in plugins_not_found:
                plugins_not_found.append(plugin_name)
        # If the user's entered a plugin that does not exist, raise an error.
        if plugins_not_found:
            raise RuntimeError("Plugin(s) not found: %s" % ','.join(plugins_not_found))

    def _get_plugin_info(self, plugin_info):
        '''Split '<plugin_name>[:<scope>]' into a (plugin_name, scope) tuple.

        The scope defaults to 'query' when it is omitted. Raises ValueError if the
        string contains more than one ':'.
        '''
        info = plugin_info.split(':')
        if len(info) == 1:
            return info[0], 'query'
        if len(info) == 2:
            return info[0], info[1]
        raise ValueError("Plugin names specified in the form <plugin_name>[:<scope>]")

    def print_plugin_names(self):
        '''Log the name and scope of every loaded plugin at debug level.'''
        # NOTE(review): __name__ is read from the plugin instance; presumably the
        # plugin classes define it as a class attribute -- confirm.
        for p in self._plugins:
            LOG.debug("Plugin: %s, Scope: %s", p.__name__, p.scope)

    def _plugins_in_scope(self, scope):
        '''Return the loaded plugins whose scope matches the requested scope.

        A falsy scope selects every plugin. Otherwise the requested scope is
        lower-cased before it is compared (plugins are constructed with a lower-cased
        scope).
        '''
        if not scope:
            return list(self._plugins)
        wanted = scope.lower()
        return [p for p in self._plugins if p.scope == wanted]

    def run_plugins_pre(self, context=None, scope=None):
        '''Run the pre-hook of every loaded plugin that matches scope.

        context: optional mutable mapping handed to each hook; when given, the
            requested scope is recorded in it under the 'scope' key.
        scope: only plugins with this scope are run; every plugin is run when it is
            None or empty.
        '''
        if not self._plugins:
            return
        # Compare against None so that an empty context still gets the scope recorded.
        if context is not None:
            context['scope'] = scope
        for p in self._plugins_in_scope(scope):
            LOG.debug('Running pre-hook for %s at scope %s', p.__name__, scope)
            p.run_pre_hook(context=context)

    def run_plugins_post(self, context=None, scope=None):
        '''Run the post-hook of every loaded plugin that matches scope.

        context: optional object handed to each hook unchanged.
        scope: only plugins with this scope are run; every plugin is run when it is
            None or empty.
        '''
        if not self._plugins:
            return
        for p in self._plugins_in_scope(scope):
            LOG.debug('Running post-hook for %s at scope %s', p.__name__, scope)
            p.run_post_hook(context=context)