apache · xinrong-meng · Jun 27, 2025 · Jun 27, 2025 · Jun 27, 2025 · Jun 30, 2025
diff --git a/python/pyspark/pandas/series.py b/python/pyspark/pandas/series.py
@@ -104,6 +104,7 @@
 from pyspark.pandas.plot import PandasOnSparkPlotAccessor
 from pyspark.pandas.utils import (
     combine_frames,
+    is_ansi_mode_enabled,
     is_name_like_tuple,
     is_name_like_value,
     name_like_string,
@@ -5660,11 +5661,21 @@ def dot(self, other: Union["Series", DataFrame]) -> Union[Scalar, "Series"]:
         y   -14
         dtype: int64
         """
+        spark_session = self._internal.spark_frame.sparkSession
         if not same_anchor(self, other):
-            if get_option("compute.eager_check") and not cast(
-                ps.Index, self.index.sort_values()
-            ).equals(cast(ps.Index, other.index.sort_values())):
-                raise ValueError("matrices are not aligned")
+            if get_option("compute.eager_check"):
+                if is_ansi_mode_enabled(spark_session):
+                    # In ANSI mode, "equals" triggers implicit casting, which may raise
+                    # CAST_INVALID_INPUT. Instead, compare the index values collected to the driver.
+                    if sorted(ps.Index(self.index).tolist()) != sorted(
+                        ps.Index(other.index).tolist()
+                    ):
+                        raise ValueError("matrices are not aligned")
+                else:
+                    if not cast(ps.Index, self.index.sort_values()).equals(
+                        cast(ps.Index, other.index.sort_values())
+                    ):
+                        raise ValueError("matrices are not aligned")
             elif len(self.index) != len(other.index):
                 raise ValueError("matrices are not aligned")
 

diff --git a/python/pyspark/pandas/tests/diff_frames_ops/test_dot_frame.py b/python/pyspark/pandas/tests/diff_frames_ops/test_dot_frame.py
@@ -21,7 +21,6 @@
 from pyspark.pandas.config import set_option, reset_option
 from pyspark.testing.pandasutils import PandasOnSparkTestCase
 from pyspark.testing.sqlutils import SQLTestUtils
-from pyspark.testing.utils import is_ansi_mode_test, ansi_mode_not_supported_message
 
 
 class DiffFramesDotFrameMixin:
@@ -35,7 +34,6 @@ def tearDownClass(cls):
         reset_option("compute.ops_on_diff_frames")
         super().tearDownClass()
 
-    @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
     def test_frame_dot(self):
         pdf = pd.DataFrame([[0, 1, -2, -1], [1, 1, 1, 1]])
         psdf = ps.from_pandas(pdf)

diff --git a/python/pyspark/pandas/tests/series/test_series.py b/python/pyspark/pandas/tests/series/test_series.py
@@ -662,7 +662,6 @@ def test_items(self):
             self.assert_eq(p_name, k_name)
             self.assert_eq(p_items, k_items)
 
-    @unittest.skipIf(is_ansi_mode_test, ansi_mode_not_supported_message)
     def test_dot(self):
         pdf = pd.DataFrame({"a": [1, 2, 3], "b": [4, 5, 6]})
         psdf = ps.from_pandas(pdf)