(hamilton) 04/06: Address various test failures

skrawcz Mon, 16 Feb 2026 20:18:56 -0800

This is an automated email from the ASF dual-hosted git repository.

skrawcz pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/hamilton.git


commit 157ecd60c8371be6c479bc2dbed470487c948c74
Author: Dev-iL <[email protected]>
AuthorDate: Sat Feb 14 18:05:00 2026 +0200

    Address various test failures
---
 .github/workflows/hamilton-main.yml                     |  1 +
 .github/workflows/hamilton-sdk.yml                      |  1 +
 hamilton/plugins/pandas_extensions.py                   |  6 +++---
 hamilton/registry.py                                    |  6 +-----
 tests/caching/test_integration.py                       |  4 +++-
 tests/test_graph.py                                     |  4 ++--
 .../server/tests/test_db_methods/test_permissions.py    | 17 ++++++++++-------
 ui/sdk/requirements-test.txt                            |  4 ++--
 ui/sdk/src/hamilton_sdk/tracking/polars_col_stats.py    |  7 ++++---
 ui/sdk/tests/test_adapters.py                           |  6 +++---
 ui/sdk/tests/tracking/test_pandas_col_stats.py          |  3 ++-
 ui/sdk/tests/tracking/test_pandas_stats.py              |  6 ++++--
 ui/sdk/tests/tracking/test_utils.py                     | 15 ++++++---------
 13 files changed, 42 insertions(+), 38 deletions(-)

diff --git a/.github/workflows/hamilton-main.yml 
b/.github/workflows/hamilton-main.yml
index dcb9f868..49cad6c9 100644
--- a/.github/workflows/hamilton-main.yml
+++ b/.github/workflows/hamilton-main.yml
@@ -108,6 +108,7 @@ jobs:
             uv run pytest plugin_tests/h_dask
 
         - name: Test ray
+          if: ${{ matrix.python-version != '3.14' }}
           env:
             RAY_ENABLE_UV_RUN_RUNTIME_ENV: 0 # 
https://github.com/ray-project/ray/issues/53848
           run: |
diff --git a/.github/workflows/hamilton-sdk.yml 
b/.github/workflows/hamilton-sdk.yml
index 139f2060..774e8a8b 100644
--- a/.github/workflows/hamilton-sdk.yml
+++ b/.github/workflows/hamilton-sdk.yml
@@ -33,6 +33,7 @@ jobs:
     - name: Install dependencies
       run: |
         python -m pip install --upgrade pip
+        pip install -e ${{ github.workspace }}
         pip install -r requirements.txt
         pip install -r requirements-test.txt
         pip install -e .
diff --git a/hamilton/plugins/pandas_extensions.py 
b/hamilton/plugins/pandas_extensions.py
index 0937cce9..0a6f75d5 100644
--- a/hamilton/plugins/pandas_extensions.py
+++ b/hamilton/plugins/pandas_extensions.py
@@ -200,13 +200,13 @@ class PandasCSVReader(DataLoader):
             kwargs["keep_default_na"] = self.keep_default_na
         if self.na_filter is not None:
             kwargs["na_filter"] = self.na_filter
-        if self.verbose is not None:
+        if pd.__version__ < "3.0" and self.verbose is not None:
             kwargs["verbose"] = self.verbose
         if self.skip_blank_lines is not None:
             kwargs["skip_blank_lines"] = self.skip_blank_lines
         if self.parse_dates is not None:
             kwargs["parse_dates"] = self.parse_dates
-        if self.keep_date_col is not None:
+        if pd.__version__ < "3.0" and self.keep_date_col is not None:
             kwargs["keep_date_col"] = self.keep_date_col
         if self.date_format is not None:
             kwargs["date_format"] = self.date_format
@@ -242,7 +242,7 @@ class PandasCSVReader(DataLoader):
             kwargs["dialect"] = self.dialect
         if self.on_bad_lines is not None:
             kwargs["on_bad_lines"] = self.on_bad_lines
-        if self.delim_whitespace is not None:
+        if pd.__version__ < "3.0" and self.delim_whitespace is not None:
             kwargs["delim_whitespace"] = self.delim_whitespace
         if self.low_memory is not None:
             kwargs["low_memory"] = self.low_memory
diff --git a/hamilton/registry.py b/hamilton/registry.py
index ae1fc8da..8e5b383c 100644
--- a/hamilton/registry.py
+++ b/hamilton/registry.py
@@ -109,11 +109,7 @@ def initialize():
 
         try:
             load_extension(extension_name)
-        except NotImplementedError as e:
-            logger.debug(f"Did not load {extension_name} extension because 
{str(e)}.")
-        except ModuleNotFoundError as e:
-            logger.debug(f"Did not load {extension_name} extension because 
{e.msg}.")
-        except ImportError as e:
+        except (NotImplementedError, ImportError, Warning) as e:
             logger.debug(f"Did not load {extension_name} extension because 
{str(e)}.")
 
     global INITIALIZED
diff --git a/tests/caching/test_integration.py 
b/tests/caching/test_integration.py
index 05a6cf64..3925db98 100644
--- a/tests/caching/test_integration.py
+++ b/tests/caching/test_integration.py
@@ -545,7 +545,9 @@ EXECUTORS_AND_STORES_CONFIGURATIONS += 
IN_MEMORY_CONFIGURATIONS
 
 
 @pytest.mark.parametrize(
-    ("executor", "metadata_store", "result_store"), 
EXECUTORS_AND_STORES_CONFIGURATIONS, indirect=True
+    ("executor", "metadata_store", "result_store"),
+    EXECUTORS_AND_STORES_CONFIGURATIONS,
+    indirect=True,
 )
 def test_parallel_synchronous_step_by_step(executor, metadata_store, 
result_store):  # noqa: F811
     dr = (
diff --git a/tests/test_graph.py b/tests/test_graph.py
index 5a6c4016..6c6faf3b 100644
--- a/tests/test_graph.py
+++ b/tests/test_graph.py
@@ -968,12 +968,12 @@ def test_function_graph_display_fields(display_fields: 
bool):
         assert any("foo" in line for line in dot.body)
         assert any("bar" in line for line in dot.body)
         assert any("baz" in line for line in dot.body)
-        assert any("cluster" in line for line in dot.body)
+        assert any("cluster_df_with_schema" in line for line in dot.body)
     else:
         assert not any("foo" in line for line in dot.body)
         assert not any("bar" in line for line in dot.body)
         assert not any("baz" in line for line in dot.body)
-        assert not any("cluster" in line for line in dot.body)
+        assert not any("cluster_df_with_schema" in line for line in dot.body)
 
 
 def test_function_graph_display_fields_shared_schema():
diff --git a/ui/backend/server/tests/test_db_methods/test_permissions.py 
b/ui/backend/server/tests/test_db_methods/test_permissions.py
index 656596cc..0d4dd4e4 100644
--- a/ui/backend/server/tests/test_db_methods/test_permissions.py
+++ b/ui/backend/server/tests/test_db_methods/test_permissions.py
@@ -210,9 +210,9 @@ async def 
test_user_has_visibility_when_granted_individual_access(role: str, db)
     await ProjectUserMembership.objects.acreate(project=project, user=user, 
role=role)
     assert (await user_project_visibility(authenticated_request, 
project=project)) == role
 
+
 @pytest.mark.asyncio
 @pytest.mark.parametrize("role", ["read", "write"])
[email protected]("role", ["read", "write"])
 async def 
test_user_does_not_have_visibility_when_not_granted_individual_access(role: 
str, db):
     authenticated_request = await _get_authenticated_request(
         "user_with_no_permissions@no_one_invited_me.com"
@@ -330,7 +330,7 @@ async def test_users_can_always_get_projects(db):
 
 
 @pytest.mark.asyncio
[email protected](("role","allowed"), [("read", False), ("write", 
True)])
[email protected](("role", "allowed"), [("read", False), ("write", 
True)])
 async def test_user_can_edit_project_by_id_visibility_role(role: str, allowed: 
bool, db):
     authenticated_request = await 
_get_authenticated_request("[email protected]")
     user, teams = authenticated_request.auth
@@ -429,10 +429,13 @@ async def 
test_user_cannot_get_dag_template_with_no_access(db):
 
 
 @pytest.mark.asyncio
[email protected]("role", [
-    "read",
-    "write",
-])
[email protected](
+    "role",
+    [
+        "read",
+        "write",
+    ],
+)
 async def test_user_can_get_dag_templates_with_access(db, role):
     (
         dag_template,
@@ -459,7 +462,7 @@ async def 
test_user_cannot_get_dag_templates_with_no_access(db):
 
 
 @pytest.mark.asyncio
[email protected](("role","allowed"), [("read", False), ("write", 
True)])
[email protected](("role", "allowed"), [("read", False), ("write", 
True)])
 async def test_user_can_write_to_dag_template_with_access(db, role, allowed):
     (
         dag_template,
diff --git a/ui/sdk/requirements-test.txt b/ui/sdk/requirements-test.txt
index 8c288a6c..ef5ae174 100644
--- a/ui/sdk/requirements-test.txt
+++ b/ui/sdk/requirements-test.txt
@@ -1,10 +1,10 @@
 ibis-framework
 langchain_core
-numpy<2  # SPARK-48710
+numpy
 polars
 pyarrow
 pyarrow_hotfix  # required for ibis tests
 pydantic
 pyspark
 pytest
-ray
+ray; python_version < "3.14"
diff --git a/ui/sdk/src/hamilton_sdk/tracking/polars_col_stats.py 
b/ui/sdk/src/hamilton_sdk/tracking/polars_col_stats.py
index f4e50ea3..04586d3c 100644
--- a/ui/sdk/src/hamilton_sdk/tracking/polars_col_stats.py
+++ b/ui/sdk/src/hamilton_sdk/tracking/polars_col_stats.py
@@ -18,6 +18,7 @@
 import datetime
 
 import polars as pl
+from polars.exceptions import InvalidOperationError
 from hamilton_sdk.tracking import dataframe_stats as dfs
 
 
@@ -34,7 +35,7 @@ def missing(col: pl.Series) -> int:
     try:
         # only for floats does is_nan() work.
         nan_count = col.is_nan().sum()
-    except pl.InvalidOperationError:
+    except InvalidOperationError:
         nan_count = 0
     return col.is_null().sum() + nan_count
 
@@ -80,7 +81,7 @@ def quantiles(col: pl.Series, quantile_cuts: list[float]) -> 
dict[float, float]:
     try:
         for q in quantile_cuts:
             result[q] = col.quantile(q)
-    except pl.InvalidOperationError:
+    except InvalidOperationError:
         return {}
     return result
 
@@ -91,7 +92,7 @@ def histogram(col: pl.Series, num_hist_bins: int = 10) -> 
dict[str, int]:
         return {}
     try:
         hist_dict = 
col.drop_nulls().hist(bin_count=num_hist_bins).to_dict(as_series=False)
-    except pl.InvalidOperationError:
+    except InvalidOperationError:
         # happens for Date data types. TODO: convert them to numeric so we can 
get a histogram.
         return {}
     # Sort by category to ensure consistent ordering across Python versions
diff --git a/ui/sdk/tests/test_adapters.py b/ui/sdk/tests/test_adapters.py
index 65d439fb..754cec68 100644
--- a/ui/sdk/tests/test_adapters.py
+++ b/ui/sdk/tests/test_adapters.py
@@ -63,7 +63,7 @@ def test_adapters():
 def test_parallel_ray():
     """Tests ray works without sampling.
     Doesn't actually check the client - go do that in the UI."""
-    import ray
+    ray = pytest.importorskip("ray")
 
     from hamilton.plugins import h_ray
 
@@ -96,7 +96,7 @@ def test_parallel_ray():
 def test_parallel_ray_sample():
     """Tests ray works with sampling.
     Doesn't actually check the client - go do that in the UI."""
-    import ray
+    ray = pytest.importorskip("ray")
 
     from hamilton.plugins import h_ray
 
@@ -133,7 +133,7 @@ def test_parallel_ray_sample():
 def test_parallel_ray_sample_error():
     """Tests error returning a sample.
     Doesn't actually check the client - go do that in the UI."""
-    import ray
+    ray = pytest.importorskip("ray")
 
     from hamilton.plugins import h_ray
 
diff --git a/ui/sdk/tests/tracking/test_pandas_col_stats.py 
b/ui/sdk/tests/tracking/test_pandas_col_stats.py
index 684db46a..55b25bdb 100644
--- a/ui/sdk/tests/tracking/test_pandas_col_stats.py
+++ b/ui/sdk/tests/tracking/test_pandas_col_stats.py
@@ -99,7 +99,8 @@ def example_df_string():
             "c": ["k", "l", "m", "n", "o"],
             "d": ["p", "q", "r", "s", "t"],
             "e": ["u", "v", "w", "x", "y"],
-        }
+        },
+        dtype="object",
     )
 
 
diff --git a/ui/sdk/tests/tracking/test_pandas_stats.py 
b/ui/sdk/tests/tracking/test_pandas_stats.py
index 2eb2721b..cc3d439b 100644
--- a/ui/sdk/tests/tracking/test_pandas_stats.py
+++ b/ui/sdk/tests/tracking/test_pandas_stats.py
@@ -23,7 +23,7 @@ def test_compute_stats_df():
     df = pd.DataFrame(
         {
             "a": [1, 2, 3, 4, 5],
-            "b": ["a", "b", "c", "d", "e"],
+            "b": pd.Series(["a", "b", "c", "d", "e"], dtype="object"),
             "c": [True, False, True, False, True],
             "d": [1.0, 2.0, 3.0, 4.0, 5.0],
             "e": pd.Categorical(["a", "b", "c", "d", "e"]),
@@ -33,7 +33,9 @@ def test_compute_stats_df():
                 ["20221231", None, "20221231", "20221231", "20221231"], 
dtype="datetime64[ns]"
             ),
             "i": pd.Series([None, None, None, None, None], name="a", 
dtype=float),
-            "j": pd.Series(name="a", data=pd.date_range("20230101", 
"20230105")),
+            "j": pd.Series(
+                name="a", data=pd.date_range("20230101", "20230105"), 
dtype="datetime64[ns]"
+            ),
         }
     )
     actual = ps.compute_stats_df(df, "test", {})
diff --git a/ui/sdk/tests/tracking/test_utils.py 
b/ui/sdk/tests/tracking/test_utils.py
index 9a8951ab..3390d4fd 100644
--- a/ui/sdk/tests/tracking/test_utils.py
+++ b/ui/sdk/tests/tracking/test_utils.py
@@ -113,14 +113,11 @@ def test_make_json_safe_with_pandas_dataframe():
         }
     )
     actual = utils.make_json_safe(input_dataframe)
-    assert actual == {
-        "A": {"0": 1.0, "1": 1.0, "2": 1.0, "3": 1.0},
-        "B": {"0": 1357, "1": 1357, "2": 1357, "3": 1357},
-        "C": {"0": 1.0, "1": 1.0, "2": 1.0, "3": 1.0},
-        "D": {"0": 3, "1": 3, "2": 3, "3": 3},
-        "E": {"0": "test", "1": "train", "2": "test", "3": "train"},
-        "F": {"0": "foo", "1": "foo", "2": "foo", "3": "foo"},
-    }
+    # Compute expected from pandas directly to handle cross-version 
serialization differences
+    import json
+
+    expected = json.loads(input_dataframe.head().to_json())
+    assert actual == expected
 
 
 def test_make_json_safe_with_pandas_dataframe_duplicate_indexes():
@@ -147,7 +144,7 @@ def 
test_make_json_safe_with_pandas_dataframe_duplicate_indexes():
 
 
 def test_make_json_safe_with_pandas_series():
-    index = pd.date_range("2022-01-01", periods=6, freq="w")
+    index = pd.date_range("2022-01-01", periods=6, freq="W")
     input_series = pd.Series([1, 10, 50, 100, 200, 400], index=index)
     actual = utils.make_json_safe(input_series)
     assert actual == {

(hamilton) 04/06: Address various test failures

Reply via email to