py-why · github-actions · Apr 19, 2026 · Copilot · Apr 19, 2026
diff --git a/tests/gcm/test_auto.py b/tests/gcm/test_auto.py
@@ -41,7 +41,9 @@ def _generate_non_linear_regression_data():
 
 
 def _generate_linear_classification_data():
-    X = np.random.normal(0, 1, (100, 5))
+    # 500 samples instead of 100 to give cross-validation a stable enough signal
+    # so that LogisticRegression reliably wins over SVC for linear data.
+    X = np.random.normal(0, 1, (500, 5))
     Y = (np.sum(X * np.random.uniform(-5, 5, X.shape[1]), axis=1) > 0).astype(str)
-    X = np.random.normal(0, 1, (500, 5))
-    Y = (np.sum(X * np.random.uniform(-5, 5, X.shape[1]), axis=1) > 0).astype(str)
+    rng = np.random.default_rng(0)
+    X = rng.normal(0, 1, (500, 5))
+    Y = (np.sum(X * rng.uniform(-5, 5, X.shape[1]), axis=1) > 0).astype(str)
-    X = np.random.normal(0, 1, (500, 5))
-    Y = (np.sum(X * np.random.uniform(-5, 5, X.shape[1]), axis=1) > 0).astype(str)
+    rng = np.random.default_rng(0)
+    X = rng.normal(0, 1, (500, 5))
+    Y = (np.sum(X * rng.uniform(-5, 5, X.shape[1]), axis=1) > 0).astype(str)
 
     return X, Y