mirror of
https://github.com/apache/impala.git
synced 2025-12-19 18:12:08 -05:00
This change adds get_workload() to ImpalaTestSuite and removes it from all test suites that already returned 'functional-query'. get_workload() is also removed from CustomClusterTestSuite, which used to return 'tpch'. All other changes besides impala_test_suite.py and custom_cluster_test_suite.py are just mass removals of get_workload() functions. The behavior is only changed in custom cluster tests that didn't override get_workload(). By returning 'functional-query' instead of 'tpch', exploration_strategy() will no longer return 'core' in 'exhaustive' test runs. See IMPALA-3947 for why the workload affected exploration_strategy(). An example of an affected test is TestCatalogHMSFailures, which was skipped in both core and exhaustive runs before this change. get_workload() functions that return a different workload than 'functional-query' are not changed - it is possible that some of these also don't handle exploration_strategy() as expected, but individually checking these tests is out of scope for this patch. Change-Id: I9ec6c41ffb3a30e1ea2de773626d1485c69fe115 Reviewed-on: http://gerrit.cloudera.org:8080/22726 Reviewed-by: Riza Suminto <riza.suminto@cloudera.com> Reviewed-by: Daniel Becker <daniel.becker@cloudera.com> Tested-by: Impala Public Jenkins <impala-public-jenkins@cloudera.com>
118 lines
4.9 KiB
Python
118 lines
4.9 KiB
Python
# Licensed to the Apache Software Foundation (ASF) under one
|
|
# or more contributor license agreements. See the NOTICE file
|
|
# distributed with this work for additional information
|
|
# regarding copyright ownership. The ASF licenses this file
|
|
# to you under the Apache License, Version 2.0 (the
|
|
# "License"); you may not use this file except in compliance
|
|
# with the License. You may obtain a copy of the License at
|
|
#
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
#
|
|
# Unless required by applicable law or agreed to in writing,
|
|
# software distributed under the License is distributed on an
|
|
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
|
# KIND, either express or implied. See the License for the
|
|
# specific language governing permissions and limitations
|
|
# under the License.
|
|
|
|
from __future__ import absolute_import, division, print_function
|
|
from tests.common.impala_test_suite import ImpalaTestSuite
|
|
from tests.common.test_dimensions import (
|
|
create_single_exec_option_dimension,
|
|
create_uncompressed_text_dimension)
|
|
from tests.util.event_processor_utils import EventProcessorUtils
|
|
from tests.util.filesystem_utils import get_fs_path
|
|
|
|
|
|
class TestTestcaseBuilder(ImpalaTestSuite):
  """Tests for the COPY TESTCASE TO / COPY TESTCASE FROM statements.

  Each test exports a testcase for a query, optionally drops the tables and views the
  query references, imports the testcase again and checks that the level 2 EXPLAIN
  output of the query is the same before and after the round trip.
  """

  @classmethod
  def add_test_dimensions(cls):
    """Add the single exec option and uncompressed text dimensions to the matrix."""
    super(TestTestcaseBuilder, cls).add_test_dimensions()
    # This test only needs to be run once.
    cls.ImpalaTestMatrix.add_dimension(create_single_exec_option_dimension())
    cls.ImpalaTestMatrix.add_dimension(
        create_uncompressed_text_dimension(cls.get_workload()))

  def test_query_without_from(self):
    """Round-trip a query that references no database, table or view."""
    self._test_export_and_import(0, 0, 0, "SELECT 5 * 20")

  def test_query_with_tbls(self, unique_database):
    """Verify the basic usage. Use a unique database so the import won't impact the
    metadata used by other tests"""
    self.client.execute(
        "create table {0}.alltypes partitioned by (`year`, `month`) as "
        "select * from functional.alltypes".format(unique_database))
    self.client.execute(
        "create view {0}.alltypes_view as select * from {0}.alltypes"
        .format(unique_database))
    original_part_ids = self.get_partition_id_set(unique_database, "alltypes")

    # Test SELECT on a view. The view will be expanded and the underlying table will also
    # be exported.
    self._test_export_and_import(
        1, 1, 1,
        "select count(*) from {0}.alltypes_view".format(unique_database),
        [unique_database + ".alltypes"], [unique_database + ".alltypes_view"])

    res = self.execute_query(
        "show partitions {0}.alltypes".format(unique_database),
        {"PLANNER_TESTCASE_MODE": True})
    # 24 partitions with a Total line
    assert len(res.data) == 25

    res = self.execute_query(
        "show files in {0}.alltypes".format(unique_database),
        {"PLANNER_TESTCASE_MODE": True})
    # Each partition should have exactly one file
    assert len(res.data) == 24

    # Verify the partition ids changed
    new_part_ids = self.get_partition_id_set(unique_database, "alltypes")
    assert new_part_ids != original_part_ids

  def _test_export_and_import(self, num_dbs, num_tbls, num_views, query,
                              tbls=(), views=()):
    """Export a testcase for 'query', import it back and compare the query plans.

    num_dbs, num_tbls, num_views: the counts expected in the message returned by
        COPY TESTCASE FROM.
    query: the statement the testcase is generated for.
    tbls, views: names of tables and views to drop after the export, so that the
        second EXPLAIN has to use the imported ones.

    The generated testcase file is deleted only when every check has passed; on
    failure it is left in place.
    """
    tmp_path = get_fs_path("/tmp")
    # Make sure /tmp dir exists
    if not self.filesystem_client.exists(tmp_path):
      self.filesystem_client.make_dir(tmp_path)
    # Generate the testcase data for the query.
    testcase_generate_query = "COPY TESTCASE TO '%s' %s" % (tmp_path, query)
    result = self.execute_query(testcase_generate_query)
    assert len(result.data) == 1, "Testcase builder wrong result: {0}".format(result.data)

    # The single result row is the location of the generated testcase. Read it
    # directly rather than slicing the repr of the result list, which depends on how
    # Python happens to quote and escape the element.
    testcase_path = result.data[0]
    # Check file exists. Anything that precedes tmp_path in the returned location
    # (presumably a filesystem scheme/authority prefix) is dropped before the path is
    # handed to the filesystem client. index() raises ValueError if tmp_path is absent.
    hdfs_path = testcase_path[testcase_path.index(tmp_path):]
    assert self.filesystem_client.exists(hdfs_path), \
        "File not generated {0}".format(hdfs_path)

    result = self.execute_query("explain " + query, {"explain_level": 2})
    original_plan = result.data

    # Remove the original tables and views to make sure we use the imported ones.
    for t in tbls:
      self.execute_query("drop table if exists " + t)
    for v in views:
      self.execute_query("drop view if exists " + v)
    # Make sure the DROP events are processed so the imported ones won't be dropped
    # by them
    EventProcessorUtils.wait_for_event_processing(self)

    # Test load testcase works
    testcase_load_query = "COPY TESTCASE FROM '{0}'".format(testcase_path)
    result = self.execute_query(testcase_load_query)
    expected_msg = "{0} db(s), {1} table(s) and {2} view(s) imported for query".format(
        num_dbs, num_tbls, num_views)
    assert expected_msg in result.get_data()

    result = self.execute_query("explain " + query, {"explain_level": 2})
    new_plan = result.data
    assert new_plan == original_plan

    # Only delete testcase file if everything works fine.
    status = self.filesystem_client.delete_file_dir(hdfs_path)
    assert status, "Delete generated testcase file failed with {0}".format(status)
|