(impala) 02/03: IMPALA-12742: (Addendum) add interop tests for DATE-partitioned Iceberg tables

stigahuang Wed, 31 Jan 2024 16:18:43 -0800

This is an automated email from the ASF dual-hosted git repository.

stigahuang pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/impala.git


commit 52dcf609620b18778ae99efea91cd356987b0cc3
Author: Zoltan Borok-Nagy <[email protected]>
AuthorDate: Tue Jan 30 19:12:50 2024 +0100

    IMPALA-12742: (Addendum) add interop tests for DATE-partitioned Iceberg tables
    
    IMPALA-12742 fixed a bug related to DATE-partitioned Iceberg tables
    and also added several tests. However, it did not add interop tests
    between Hive and Impala. This CR fills this gap.
    
    Change-Id: I38e6626d388be3b400e2276de4bf929f673beffb
    Reviewed-on: http://gerrit.cloudera.org:8080/20976
    Reviewed-by: Impala Public Jenkins <[email protected]>
    Tested-by: Impala Public Jenkins <[email protected]>
---
 tests/query_test/test_iceberg.py | 19 +++++++++++++++++++
 1 file changed, 19 insertions(+)

diff --git a/tests/query_test/test_iceberg.py b/tests/query_test/test_iceberg.py
index 6baea6255..8679a3e91 100644
--- a/tests/query_test/test_iceberg.py
+++ b/tests/query_test/test_iceberg.py
@@ -1503,6 +1503,13 @@ class TestIcebergV2Table(IcebergTestSuite):
     hive_output = self.run_stmt_in_hive("SELECT count(*) FROM {}.{}".format(
         db, "ice_store_sales"))
     assert hive_output == "_c0\n2601498\n"
+    hive_output = self.run_stmt_in_hive("SELECT * FROM {}.{}".format(
+        db, "ice_alltypes_part_v2"))
+    # Cut off the long header line.
+    hive_output = hive_output.split("\n", 1)
+    hive_output = hive_output[1]
+    assert hive_output == \
+        "2,true,1,11,1.1,2.222,123.321,2022-02-22,impala\n"
 
   @SkipIfFS.hive
   def test_delete_hive_read(self, vector, unique_database):
@@ -1702,6 +1709,18 @@ class TestIcebergV2Table(IcebergTestSuite):
     assert hive_results == \
         "11,21,2111,531,75.20\n"
 
+    # HIVE-28048: Hive cannot run ORDER BY queries for Iceberg tables partitioned by
+    # decimal columns, so we order the results ourselves.
+    hive_results = self.run_stmt_in_hive("SELECT * FROM {}.{}".format(
+        db, "ice_alltypes_part_v2"))
+    # Throw away the header line and sort the results.
+    hive_results = hive_results.split("\n", 1)[1]
+    hive_results = hive_results.strip().split("\n")
+    hive_results.sort()
+    assert hive_results == [
+        "2,true,2,11,1.1,2.222,123.321,2022-04-22,impala",
+        "3,true,3,11,1.1,2.222,123.321,2022-05-22,impala"]
+
   def test_optimize(self, vector, unique_database):
     tbl_name = unique_database + ".optimize_iceberg"
     self.execute_query("""create table {0} (i int)

(impala) 02/03: IMPALA-12742: (Addendum) add interop tests for DATE-partitioned Iceberg tables

Reply via email to