Files
impala/tests/metadata/test_testcase_builder.py
Csaba Ringhofer f98b697c7b IMPALA-13929: Make 'functional-query' the default workload in tests
This change adds get_workload() to ImpalaTestSuite and removes it
from all test suites that already returned 'functional-query'.
get_workload() is also removed from CustomClusterTestSuite which
used to return 'tpch'.

All other changes besides impala_test_suite.py and
custom_cluster_test_suite.py are just mass removals of
get_workload() functions.

The behavior is only changed in custom cluster tests that didn't
override get_workload(). By returning 'functional-query' instead
of 'tpch', exploration_strategy() will no longer return 'core' in
'exhaustive' test runs. See IMPALA-3947 for why the workload affected
exploration_strategy(). An example of an affected test is
TestCatalogHMSFailures, which was skipped in both core and exhaustive
runs before this change.

get_workload() functions that return a different workload than
'functional-query' are not changed - it is possible that some of
these also don't handle exploration_strategy() as expected, but
individually checking these tests is out of scope in this patch.

Change-Id: I9ec6c41ffb3a30e1ea2de773626d1485c69fe115
Reviewed-on: http://gerrit.cloudera.org:8080/22726
Reviewed-by: Riza Suminto <riza.suminto@cloudera.com>
Reviewed-by: Daniel Becker <daniel.becker@cloudera.com>
Tested-by: Impala Public Jenkins <impala-public-jenkins@cloudera.com>
2025-04-08 07:12:55 +00:00

118 lines
4.9 KiB
Python

# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
from __future__ import absolute_import, division, print_function
from tests.common.impala_test_suite import ImpalaTestSuite
from tests.common.test_dimensions import (
create_single_exec_option_dimension,
create_uncompressed_text_dimension)
from tests.util.event_processor_utils import EventProcessorUtils
from tests.util.filesystem_utils import get_fs_path
class TestTestcaseBuilder(ImpalaTestSuite):
  """Tests that export a query with COPY TESTCASE TO and import it back with
  COPY TESTCASE FROM."""

  @classmethod
  def add_test_dimensions(cls):
    """Restrict the test matrix to a single exec option and uncompressed text."""
    super(TestTestcaseBuilder, cls).add_test_dimensions()
    # This test only needs to be run once.
    cls.ImpalaTestMatrix.add_dimension(create_single_exec_option_dimension())
    cls.ImpalaTestMatrix.add_dimension(
      create_uncompressed_text_dimension(cls.get_workload()))

  def test_query_without_from(self):
    """Export and import a testcase for a query that references no tables."""
    self._test_export_and_import(0, 0, 0, "SELECT 5 * 20")

  def test_query_with_tbls(self, unique_database):
    """Verify the basic usage. Use a unique database so the import won't impact the
    metadata used by other tests"""
    self.client.execute(
      "create table {0}.alltypes partitioned by (`year`, `month`) as "
      "select * from functional.alltypes".format(unique_database))
    self.client.execute(
      "create view {0}.alltypes_view as select * from {0}.alltypes"
      .format(unique_database))
    # Captured before the import so the ids can be compared afterwards.
    original_part_ids = self.get_partition_id_set(unique_database, "alltypes")

    # Test SELECT on a view. The view will be expanded and the underlying table will also
    # be exported.
    self._test_export_and_import(
      1, 1, 1,
      "select count(*) from {0}.alltypes_view".format(unique_database),
      [unique_database + ".alltypes"], [unique_database + ".alltypes_view"])

    res = self.execute_query(
      "show partitions {0}.alltypes".format(unique_database),
      {"PLANNER_TESTCASE_MODE": True})
    # 24 partitions with a Total line
    assert len(res.data) == 25
    res = self.execute_query(
      "show files in {0}.alltypes".format(unique_database),
      {"PLANNER_TESTCASE_MODE": True})
    # Each partition should have exactly one file
    assert len(res.data) == 24

    # Verify the partition ids changed
    new_part_ids = self.get_partition_id_set(unique_database, "alltypes")
    assert new_part_ids != original_part_ids

  def _test_export_and_import(self, num_dbs, num_tbls, num_views, query,
                              tbls=(), views=()):
    """Export a testcase for 'query', drop 'tbls' and 'views', import the testcase
    back and verify that the explain output of 'query' did not change.

    'num_dbs', 'num_tbls' and 'num_views' are the counts expected in the message
    returned by COPY TESTCASE FROM. 'tbls' and 'views' are the names of the tables and
    views to drop before the import. The generated testcase file is only deleted when
    every check passes.
    """
    tmp_path = get_fs_path("/tmp")
    # Make sure /tmp dir exists
    if not self.filesystem_client.exists(tmp_path):
      self.filesystem_client.make_dir(tmp_path)

    # Export the testcase data for the query.
    testcase_generate_query = "COPY TESTCASE TO '%s' %s" % (tmp_path, query)
    result = self.execute_query(testcase_generate_query)
    assert len(result.data) == 1, "Testcase builder wrong result: {0}".format(result.data)

    # The single result row holds the path of the generated testcase file. Read it
    # directly instead of slicing the repr() of the result list, which depends on how
    # Python quotes and escapes the string.
    testcase_location = result.data[0]
    # Check file exists. Only the part starting at tmp_path is passed to the
    # filesystem client.
    hdfs_path = testcase_location[testcase_location.index(tmp_path):]
    assert self.filesystem_client.exists(hdfs_path), \
      "File not generated {0}".format(hdfs_path)

    result = self.execute_query("explain " + query, {"explain_level": 2})
    original_plan = result.data

    # Remove the original tables and views to make sure we use the imported ones.
    for t in tbls:
      self.execute_query("drop table if exists " + t)
    for v in views:
      self.execute_query("drop view if exists " + v)
    # Make sure the DROP events are processed so the imported ones won't be dropped
    # by them
    EventProcessorUtils.wait_for_event_processing(self)

    # Test load testcase works
    testcase_load_query = "COPY TESTCASE FROM '{0}'".format(testcase_location)
    result = self.execute_query(testcase_load_query)
    expected_msg = "{0} db(s), {1} table(s) and {2} view(s) imported for query".format(
      num_dbs, num_tbls, num_views)
    assert expected_msg in result.get_data()

    # The plan produced from the imported metadata must match the original one.
    result = self.execute_query("explain " + query, {"explain_level": 2})
    new_plan = result.data
    assert new_plan == original_plan

    # Only delete testcase file if everything works fine.
    status = self.filesystem_client.delete_file_dir(hdfs_path)
    assert status, "Delete generated testcase file failed with {0}".format(status)