This is an automated email from the ASF dual-hosted git repository.

stigahuang pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/impala.git

commit 0e3ae5c339fad3183ba8ce5c0c7d954e50dee091
Author: stiga-huang <[email protected]>
AuthorDate: Sun Apr 27 16:45:57 2025 +0800

    IMPALA-13996: Deflake test_too_many_files by creating dedicated tables
    
    TestAllowIncompleteData.test_too_many_files depends on
    tpch_parquet.lineitem having exactly 3 data files. This does not hold in
    erasure coding builds, in which tpch_parquet.lineitem has only 2 data
    files.
    
    This fixes the test to use dedicated tables created in the test.
    
    Change-Id: I28cec8ec4bc59f066aa15a7243b7163639706cc7
    Reviewed-on: http://gerrit.cloudera.org:8080/22824
    Reviewed-by: Jason Fehr <[email protected]>
    Tested-by: Impala Public Jenkins <[email protected]>
---
 tests/custom_cluster/test_local_catalog.py | 14 +++++++++-----
 1 file changed, 9 insertions(+), 5 deletions(-)

diff --git a/tests/custom_cluster/test_local_catalog.py b/tests/custom_cluster/test_local_catalog.py
index 3f7da98d8..c4e92e9ba 100644
--- a/tests/custom_cluster/test_local_catalog.py
+++ b/tests/custom_cluster/test_local_catalog.py
@@ -713,11 +713,15 @@ class TestAllowIncompleteData(CustomClusterTestSuite):
     catalogd_args="--catalog_topic_mode=minimal 
--catalog_partial_fetch_max_files=1")
   def test_too_many_files(self, unique_database):
     """Test the error reporting the limit is too small"""
-    exception = self.execute_query_expect_failure(
-        self.client, "show files in tpch_parquet.lineitem")
-    err = ("Too many files to collect in table tpch_parquet.lineitem: 3. 
Current limit "
-           "is 1 configured by startup flag 'catalog_partial_fetch_max_files'. 
Consider "
-           "compacting files of the table.")
+    # Create a non-partitioned table with multiple files
+    tbl = unique_database + ".tbl"
+    self.execute_query("create table {0} (i int)".format(tbl))
+    self.execute_query("insert into {0} values (0)".format(tbl))
+    self.execute_query("insert into {0} values (1)".format(tbl))
+    exception = self.execute_query_expect_failure(self.client, "show files in 
" + tbl)
+    err = ("Too many files to collect in table {0}: 2. Current limit is 1 
configured by "
+           "startup flag 'catalog_partial_fetch_max_files'. Consider 
compacting files of"
+           " the table.").format(tbl)
     assert err in str(exception)
     self.assert_catalogd_log_contains("ERROR", err)
 

Reply via email to