Apply pre-commit fixes (v2)

pandeconscious · pandeconscious · commit b90726fd73f5 · 2025-10-27T13:40:09.000Z
diff --git a/pandas/core/frame.py b/pandas/core/frame.py
@@ -11670,7 +11670,6 @@ def corr(
         if method in ("spearman", "kendall"):
             data = data._transform_ord_cat_cols_to_coded_cols()
 
-
         mat = data.to_numpy(dtype=float, na_value=np.nan, copy=False)
 
         if method == "pearson":
@@ -11966,6 +11965,7 @@ def corrwith(
         elif method in ["kendall", "spearman"] or callable(method):
             left = left._transform_ord_cat_cols_to_coded_cols()
             right = right._transform_ord_cat_cols_to_coded_cols()
+
             def c(x):
                 return nanops.nancorr(x[0], x[1], method=method)
 
@@ -11998,8 +11998,8 @@ def c(x):
 
     def _transform_ord_cat_cols_to_coded_cols(self) -> DataFrame:
         """
-        any ordered categorical columns are transformed to the respectice caregorical codes
-        other columns remain untouched
+        Transform any ordered categorical columns to their respective
+        categorical codes, leaving all other columns untouched.
         """
         categ = self.select_dtypes("category")
         if len(categ.columns) == 0:
diff --git a/pandas/core/series.py b/pandas/core/series.py
@@ -2686,7 +2686,7 @@ def corr(
         this, other = self.align(other, join="inner")
         if len(this) == 0:
             return np.nan
-    
+
         if method in ("spearman", "kendall"):
             if this.dtype == "category" and this.cat.ordered:
                 this = this.cat.codes.replace(-1, np.nan)
diff --git a/pandas/tests/frame/methods/test_cov_corr.py b/pandas/tests/frame/methods/test_cov_corr.py
@@ -1,4 +1,5 @@
 from itertools import combinations
+
 import numpy as np
 import pytest
 
@@ -252,24 +253,45 @@ def test_corr_numeric_only(self, meth, numeric_only):
         else:
             with pytest.raises(ValueError, match="could not convert string to float"):
                 df.corr(meth, numeric_only=numeric_only)
-    
+
     @pytest.mark.parametrize("method", ["kendall", "spearman"])
-    def test_corr_rank_ordered_categorical(self, method,):
+    def test_corr_rank_ordered_categorical(
+        self,
+        method,
+    ):
         df = DataFrame(
             {
-                "ord_cat": pd.Series(pd.Categorical(["low", "m", "h", "vh"], categories=["low", "m", "h", "vh"], ordered=True)), 
-                "ord_cat_none": pd.Series(pd.Categorical(["low", "m", "h", None], categories=["low", "m", "h"], ordered=True)), 
-                "ord_int": pd.Series([0, 1, 2, 3]), 
-                "ord_float": pd.Series([2.0, 3.0, 4.5, 6.5]),
-                "ord_float_nan": pd.Series([2.0, 3.0, 4.5, np.nan]),
-                "ord_cat_shuff": pd.Series(pd.Categorical(["m", "h", "vh", "low"], categories=["low", "m", "h", "vh"], ordered=True)), 
+                "ord_cat": Series(
+                    pd.Categorical(
+                        ["low", "m", "h", "vh"],
+                        categories=["low", "m", "h", "vh"],
+                        ordered=True,
+                    )
+                ),
+                "ord_cat_none": Series(
+                    pd.Categorical(
+                        ["low", "m", "h", None],
+                        categories=["low", "m", "h"],
+                        ordered=True,
+                    )
+                ),
+                "ord_int": Series([0, 1, 2, 3]),
+                "ord_float": Series([2.0, 3.0, 4.5, 6.5]),
+                "ord_float_nan": Series([2.0, 3.0, 4.5, np.nan]),
+                "ord_cat_shuff": Series(
+                    pd.Categorical(
+                        ["m", "h", "vh", "low"],
+                        categories=["low", "m", "h", "vh"],
+                        ordered=True,
+                    )
+                ),
+                "ord_int_shuff": Series([2, 3, 0, 1]),
             }
         )
         corr_calc = df.corr(method=method)
-        for col1, col2 in combinations(["ord_cat", "ord_int", "ord_float"], r=2):
-            expected = df[col1].corr(df[col2], method=method)
-            tm.assert_almost_equal(corr_calc[col1][col2], expected)
-
+        for col1, col2 in combinations(df.columns, r=2):
+            corr_expected = df[col1].corr(df[col2], method=method)
+            tm.assert_almost_equal(corr_calc[col1][col2], corr_expected)
 
 
 class TestDataFrameCorrWith:
@@ -512,3 +534,49 @@ def test_cov_with_missing_values(self):
         result2 = df.dropna().cov()
         tm.assert_frame_equal(result1, expected)
         tm.assert_frame_equal(result2, expected)
+
+    @pytest.mark.parametrize("method", ["kendall", "spearman"])
+    def test_corr_rank_ordered_categorical(
+        self,
+        method,
+    ):
+        df1 = DataFrame(
+            {
+                "a": Series(
+                    pd.Categorical(
+                        ["low", "m", "h", "vh"],
+                        categories=["low", "m", "h", "vh"],
+                        ordered=True,
+                    )
+                ),
+                "b": Series(
+                    pd.Categorical(
+                        ["low", "m", "h", None],
+                        categories=["low", "m", "h"],
+                        ordered=True,
+                    )
+                ),
+                "c": Series([0, 1, 2, 3]),
+                "d": Series([2.0, 3.0, 4.5, 6.5]),
+            }
+        )
+
+        df2 = DataFrame(
+            {
+                "a": Series([2.0, 3.0, 4.5, np.nan]),
+                "b": Series(
+                    pd.Categorical(
+                        ["m", "h", "vh", "low"],
+                        categories=["low", "m", "h", "vh"],
+                        ordered=True,
+                    )
+                ),
+                "c": Series([2, 3, 0, 1]),
+                "d": Series([2.0, 3.0, 4.5, 6.5]),
+            }
+        )
+
+        corr_calc = df1.corrwith(df2, method=method)
+        for col in df1.columns:
+            corr_expected = df1[col].corr(df2[col], method=method)
+            tm.assert_almost_equal(corr_calc.get(col), corr_expected)
diff --git a/pandas/tests/series/methods/test_cov_corr.py b/pandas/tests/series/methods/test_cov_corr.py
@@ -11,6 +11,7 @@
 )
 import pandas._testing as tm
 
+
 class TestSeriesCov:
     def test_cov(self, datetime_series):
         # full overlap
@@ -183,54 +184,77 @@ def test_corr_callable_method(self, datetime_series):
         df = pd.DataFrame([s1, s2])
         expected = pd.DataFrame([{0: 1.0, 1: 0}, {0: 0, 1: 1.0}])
         tm.assert_almost_equal(df.transpose().corr(method=my_corr), expected)
-    
+
     @pytest.mark.parametrize("method", ["kendall", "spearman"])
-    def test_corr_rank_ordered_categorical(self, method,):
+    def test_corr_rank_ordered_categorical(
+        self,
+        method,
+    ):
         stats = pytest.importorskip("scipy.stats")
-        method_scipy_func = {
-            "kendall": stats.kendalltau,
-            "spearman": stats.spearmanr
-        }
-        ser_ord_cat = pd.Series( pd.Categorical(
-             ["low", "med", "high", "very_high"], 
-             categories=["low", "med", "high", "very_high"], ordered=True
-             ))
+        method_scipy_func = {"kendall": stats.kendalltau, "spearman": stats.spearmanr}
+        ser_ord_cat = Series(
+            pd.Categorical(
+                ["low", "med", "high", "very_high"],
+                categories=["low", "med", "high", "very_high"],
+                ordered=True,
+            )
+        )
         ser_ord_cat_codes = ser_ord_cat.cat.codes.replace(-1, np.nan)
-        ser_ord_int = pd.Series([0, 1, 2, 3])
-        ser_ord_float = pd.Series([2.0, 3.0, 4.5, 6.5])
-    
+        ser_ord_int = Series([0, 1, 2, 3])
+        ser_ord_float = Series([2.0, 3.0, 4.5, 6.5])
+
         corr_calc = ser_ord_cat.corr(ser_ord_int, method=method)
-        corr_expected = method_scipy_func[method](ser_ord_cat_codes, ser_ord_int, nan_policy="omit")[0]
+        corr_expected = method_scipy_func[method](
+            ser_ord_cat_codes, ser_ord_int, nan_policy="omit"
+        )[0]
         tm.assert_almost_equal(corr_calc, corr_expected)
 
         corr_calc = ser_ord_cat.corr(ser_ord_float, method=method)
-        corr_expected = method_scipy_func[method](ser_ord_cat_codes, ser_ord_float, nan_policy="omit")[0]
+        corr_expected = method_scipy_func[method](
+            ser_ord_cat_codes, ser_ord_float, nan_policy="omit"
+        )[0]
         tm.assert_almost_equal(corr_calc, corr_expected)
 
         corr_calc = ser_ord_cat.corr(ser_ord_cat, method=method)
-        corr_expected = method_scipy_func[method](ser_ord_cat_codes, ser_ord_cat_codes, nan_policy="omit")[0]
+        corr_expected = method_scipy_func[method](
+            ser_ord_cat_codes, ser_ord_cat_codes, nan_policy="omit"
+        )[0]
         tm.assert_almost_equal(corr_calc, corr_expected)
 
-        ser_ord_cat_shuff = pd.Series( pd.Categorical(
-             ["high", "low", "very_high", "med"], 
-             categories=["low", "med", "high", "very_high"], ordered=True
-             ))
+        ser_ord_cat_shuff = Series(
+            pd.Categorical(
+                ["high", "low", "very_high", "med"],
+                categories=["low", "med", "high", "very_high"],
+                ordered=True,
+            )
+        )
         ser_ord_cat_shuff_codes = ser_ord_cat_shuff.cat.codes.replace(-1, np.nan)
-        
+
         corr_calc = ser_ord_cat_shuff.corr(ser_ord_cat, method=method)
-        corr_expected = method_scipy_func[method](ser_ord_cat_shuff_codes, ser_ord_cat_codes, nan_policy="omit")[0]
+        corr_expected = method_scipy_func[method](
+            ser_ord_cat_shuff_codes, ser_ord_cat_codes, nan_policy="omit"
+        )[0]
         tm.assert_almost_equal(corr_calc, corr_expected)
 
         corr_calc = ser_ord_cat_shuff.corr(ser_ord_cat_shuff, method=method)
-        corr_expected = method_scipy_func[method](ser_ord_cat_shuff_codes, ser_ord_cat_shuff_codes, nan_policy="omit")[0]
+        corr_expected = method_scipy_func[method](
+            ser_ord_cat_shuff_codes, ser_ord_cat_shuff_codes, nan_policy="omit"
+        )[0]
         tm.assert_almost_equal(corr_calc, corr_expected)
-        
-        ser_ord_cat_with_nan = pd.Series( pd.Categorical(
-             ["h", "low", "vh", None, "m"], 
-             categories=["low", "m", "h", "vh"], ordered=True
-             ))
-        ser_ord_cat_shuff_with_nan_codes = ser_ord_cat_with_nan.cat.codes.replace(-1, np.nan)
-        ser_ord_int = pd.Series([2, 0, 1, 3, None])
+
+        ser_ord_cat_with_nan = Series(
+            pd.Categorical(
+                ["h", "low", "vh", None, "m"],
+                categories=["low", "m", "h", "vh"],
+                ordered=True,
+            )
+        )
+        ser_ord_cat_shuff_with_nan_codes = ser_ord_cat_with_nan.cat.codes.replace(
+            -1, np.nan
+        )
+        ser_ord_int = Series([2, 0, 1, 3, None])
         corr_calc = ser_ord_cat_with_nan.corr(ser_ord_int, method=method)
-        corr_expected = method_scipy_func[method](ser_ord_cat_shuff_with_nan_codes, ser_ord_int, nan_policy="omit")[0]
-        tm.assert_almost_equal(corr_calc, corr_expected)
+        corr_expected = method_scipy_func[method](
+            ser_ord_cat_shuff_with_nan_codes, ser_ord_int, nan_policy="omit"
+        )[0]
+        tm.assert_almost_equal(corr_calc, corr_expected)
diff --git a/test_corr.py b/test_corr.py
@@ -1,23 +1,27 @@
 import pandas as pd
-df = pd.DataFrame({'a' : [1, 2, 3, 4], 'b' : [4, 3, 2, 1]})
-df['b'] = df['b'].astype('category').cat.set_categories([4, 3, 2, 1], ordered=True)
-#import pdb; pdb.set_trace()
-crr = df.corr(method='spearman')
+
+df = pd.DataFrame({"a": [1, 2, 3, 4], "b": [4, 3, 2, 1]})
+df["b"] = df["b"].astype("category").cat.set_categories([4, 3, 2, 1], ordered=True)
+# import pdb; pdb.set_trace()
+crr = df.corr(method="spearman")
 print(crr)
 
 
-df = pd.DataFrame({'a' : [1, 2, 3, 4], 'b' : ["vh", "h", "m", "l"]})
-df['b'] = df['b'].astype('category').cat.set_categories(["vh", "h", "m", "l"], ordered=True)
-#import pdb; pdb.set_trace()
+df = pd.DataFrame({"a": [1, 2, 3, 4], "b": ["vh", "h", "m", "l"]})
+df["b"] = (
+    df["b"].astype("category").cat.set_categories(["vh", "h", "m", "l"], ordered=True)
+)
+# import pdb; pdb.set_trace()
 print(df)
 print(df.dtypes)
-crr = df.corr(method='spearman')
+crr = df.corr(method="spearman")
 print(crr)
 
-ser_ord_cat = pd.Series( pd.Categorical(
-             ["vh", "h", "m", "low"], 
-             categories=["vh", "h", "m", "low"], ordered=True
-             ))
+ser_ord_cat = pd.Series(
+    pd.Categorical(
+        ["vh", "h", "m", "low"], categories=["vh", "h", "m", "low"], ordered=True
+    )
+)
 print(ser_ord_cat)
-crr = ser_ord_cat.corr(ser_ord_cat, method='spearman')
-print(crr)
+crr = ser_ord_cat.corr(ser_ord_cat, method="spearman")
+print(crr)