IntelPython · Alexsandruss · Apr 28, 2025
@@ -0,0 +1,27 @@
+{
+    "PARAMETERS_SETS": {
+        "common dbscan parameters": {
+            "algorithm": {
+                "estimator": "DBSCAN",
+                "estimator_params": {
+                    "eps": "[SPECIAL_VALUE]distances_quantile:0.01",
+                    "min_samples": 5,
+                    "metric": "euclidean"
+                }
+            }
+        },
+        "sklearn dbscan parameters": {
+            "algorithm": {
+                "estimator_params": {
+                    "algorithm": "brute",
+                    "n_jobs": "[SPECIAL_VALUE]physical_cpus"
+                }
+            }
+        },
+        "cuml dbscan parameters": {
+            "algorithm": {
+                "estimator_params": { "calc_core_sample_indices": false, "verbose": 2 }
+            }
+        }
+    }
+}
@@ -0,0 +1,64 @@
+{
+    "PARAMETERS_SETS": {
+        "common ensemble params": {
+            "algorithm": {
+                "estimator_params": {
+                    "n_estimators": 500,
+                    "max_depth": 12,
+                    "max_samples": 0.8,
+                    "min_samples_split": 5,
+                    "min_samples_leaf": 2,
+                    "min_impurity_decrease": 0.0,
+                    "bootstrap": true,
+                    "random_state": 42
+                }
+            }
+        },
+        "sklearn ensemble classifier params": {
+            "algorithm": {
+                "estimator": ["RandomForestClassifier", "ExtraTreesClassifier"],
+                "estimator_params": {
+                    "criterion": "gini",
+                    "max_features": "sqrt",
+                    "max_leaf_nodes": null,
+                    "n_jobs": "[SPECIAL_VALUE]physical_cpus"
+                }
+            }
+        },
+        "sklearn ensemble regressor params": {
+            "algorithm": {
+                "estimator": ["RandomForestRegressor", "ExtraTreesRegressor"],
+                "estimator_params": {
+                    "criterion": "squared_error",
+                    "max_features": 1.0,
+                    "max_leaf_nodes": null,
+                    "n_jobs": "[SPECIAL_VALUE]physical_cpus"
+                }
+            }
+        },
+        "cuml ensemble classifier params": {
+            "algorithm": {
+                "estimator": "RandomForestClassifier",
+                "estimator_params": {
+                    "n_streams": 4,
+                    "split_criterion": "gini",
+                    "max_features": "sqrt",
+                    "max_leaves": -1,
+                    "n_bins": 256
+                }
+            }
+        },
+        "cuml ensemble regressor params": {
+            "algorithm": {
+                "estimator": "RandomForestRegressor",
+                "estimator_params": {
+                    "n_streams": 4,
+                    "split_criterion": "mse",
+                    "max_features": 1.0,
+                    "max_leaves": -1,
+                    "n_bins": 256
+                }
+            }
+        }
+    }
+}
@@ -0,0 +1,25 @@
+{
+    "PARAMETERS_SETS": {
+        "common kmeans parameters": {
+            "algorithm": {
+                "estimator": "KMeans",
+                "estimator_params": {
+                    "n_clusters": "[SPECIAL_VALUE]auto",
+                    "n_init": 1,
+                    "max_iter": 30,
+                    "tol": 1e-3,
+                    "random_state": 42
+                },
+                "estimator_methods": { "inference": "predict" }
+            }
+        },
+        "sklearn kmeans parameters": {
+            "algorithm": { "estimator_params": { "init": "k-means++", "algorithm": "lloyd" } }
+        },
+        "cuml kmeans parameters": {
+            "algorithm": {
+                "estimator_params": { "init": "scalable-k-means++" }
+            }
+        }
+    }
+}
@@ -0,0 +1,42 @@
+{
+    "PARAMETERS_SETS": {
+        "common knn parameters": {
+            "algorithm": {
+                "estimator_params": {
+                    "n_neighbors": [10, 100],
+                    "weights": "uniform"
+                }
+            },
+            "data": {
+                "preprocessing_kwargs": { "normalize": true }
+            }
+        },
+        "sklearn knn parameters": {
+            "algorithm": { "estimator_params": { "n_jobs": "[SPECIAL_VALUE]physical_cpus" } }
+        },
+        "brute knn classification parameters": {
+            "algorithm": {
+                "estimator": "KNeighborsClassifier",
+                "estimator_params": { "algorithm": "brute", "metric": "minkowski", "p": [1, 2] }
+            }
+        },
+        "kd_tree knn classification parameters": {
+            "algorithm": {
+                "estimator": "KNeighborsClassifier",
+                "estimator_params": { "algorithm": "kd_tree", "metric": "minkowski", "p": 2 }
+            }
+        },
+        "brute knn regression parameters": {
+            "algorithm": {
+                "estimator": "KNeighborsRegressor",
+                "estimator_params": { "algorithm": "brute", "metric": "minkowski", "p": [1, 2] }
+            }
+        },
+        "kd_tree knn regression parameters": {
+            "algorithm": {
+                "estimator": "KNeighborsRegressor",
+                "estimator_params": { "algorithm": "kd_tree", "metric": "minkowski", "p": 2 }
+            }
+        }
+    }
+}
@@ -0,0 +1,45 @@
+{
+    "PARAMETERS_SETS": {
+        "lightgbm implementations": [
+            {
+                "algorithm": {
+                    "device": "cpu",
+                    "estimator_params": {
+                        "boosting_type": "gbdt",
+                        "verbosity": -1,
+                        "n_jobs": "[SPECIAL_VALUE]physical_cpus"
+                    },
+                    "enable_modelbuilders": false
+                }
+            }
+        ],
+        "lightgbm binary classification": {
+            "algorithm": {
+                "library": "lightgbm",
+                "estimator": "LGBMClassifier",
+                "estimator_params": {
+                    "objective": "binary"
+                }
+            }
+        },
+        "lightgbm multi classification": {
+            "algorithm": {
+                "library": "lightgbm",
+                "estimator": "LGBMClassifier",
+                "estimator_params": {
+                    "objective": "multiclass",
+                    "num_classes": "[SPECIAL_VALUE]auto"
+                }
+            }
+        },
+        "lightgbm regression": {
+            "algorithm": {
+                "library": "lightgbm",
+                "estimator": "LGBMRegressor",
+                "estimator_params": {
+                    "objective": "regression"
+                }
+            }
+        }
+    }
+}
@@ -0,0 +1,56 @@
+{
+    "PARAMETERS_SETS": {
+        "common linear parameters": {
+            "algorithm": {
+                "estimator": "LinearRegression",
+                "estimator_params": { "fit_intercept": true, "copy_X": true }
+            }
+        },
+        "common ridge parameters": {
+            "algorithm": {
+                "estimator": "Ridge",
+                "estimator_params": {
+                    "fit_intercept": true,
+                    "alpha": 2.0
+                }
+            }
+        },
+        "common lasso parameters": {
+            "algorithm": {
+                "estimator": "Lasso",
+                "estimator_params": {
+                    "fit_intercept": true,
+                    "max_iter": 1000,
+                    "selection": "cyclic",
+                    "alpha": 1e-3,
+                    "tol": 1e-6
+                }
+            }
+        },
+        "common elasticnet parameters": {
+            "algorithm": {
+                "estimator": "ElasticNet",
+                "estimator_params": {
+                    "fit_intercept": true,
+                    "max_iter": 1000,
+                    "selection": "cyclic",
+                    "alpha": 1e-3,
+                    "l1_ratio": 0.9,
+                    "tol": 1e-6
+                }
+            }
+        },
+        "sklearn linear parameters": {
+            "estimator_params": { "n_jobs": "[SPECIAL_VALUE]physical_cpus" }
+        },
+        "sklearn ridge parameters": {
+            "estimator_params": { "solver": "auto", "tol": 1e-4 }
+        },
+        "cuml L2 parameters": {
+            "estimator_params": { "solver": "eig" }
+        },
+        "cuml L1 parameters": {
+            "estimator_params": { "solver": "cd" }
+        }
+    }
+}
@@ -0,0 +1,29 @@
+{
+    "INCLUDE": ["../common/sklearn.json"],
+    "PARAMETERS_SETS": {
+        "common logreg parameters": {
+            "algorithm": {
+                "estimator": "LogisticRegression",
+                "estimator_methods": { "inference": "predict" },
+                "estimator_params": {
+                    "penalty": "l2",
+                    "tol": 1e-4,
+                    "C": 1.0,
+                    "l1_ratio": null,
+                    "max_iter": 200
+                }
+            }
+        },
+        "sklearn logreg parameters": {
+            "algorithm": {
+                "estimator_params": {
+                    "solver": "lbfgs",
+                    "random_state": 42
+                }
+            }
+        },
+        "cuml logreg parameters": {
+            "algorithm": { "estimator_params": { "solver": "qn" } }
+        }
+    }
+}
@@ -0,0 +1,27 @@
+{
+    "INCLUDE": ["../common/sklearn.json"],
+    "PARAMETERS_SETS": {
+        "pca parameters": {
+            "algorithm": {
+                "estimator": "PCA",
+                "estimator_params": {
+                    "n_components": 3,
+                    "copy": true,
+                    "whiten": false,
+                    "svd_solver": "covariance_eigh",
+                    "tol": 0.0,
+                    "iterated_power": 15,
+                    "random_state": 42
+                }
+            }
+        },
+        "cuml pca parameters": {
+            "algorithm": {
+                "estimator_params": {
+                    "svd_solver": "full",
+                    "random_state": "[REMOVE]"
+                }
+            }
+        }
+    }
+}
@@ -12,13 +12,6 @@
                 { "library": "sklearnex", "device": ["cpu", "gpu"] }
             ]
         },
-        "sklearn-ex[preview] implementations": {
-            "algorithm": [
-                { "library": "sklearn", "device": "cpu" },
-                { "library": "sklearnex", "device": "cpu" },
-                { "library": "sklearnex.preview", "device": ["cpu", "gpu"] }
-            ]
-        },
         "sklearnex spmd implementation": {
             "algorithm": {
                 "library": "sklearnex.spmd",
@@ -50,7 +43,19 @@
         },
         "cuml implementation": {
             "algorithm": { "library": "cuml" },
-            "data": { "format": "cudf" }
+            "data": { "format": "cupy" }
+        },
+        "extended data formats": {
+            "data": [
+                {
+                    "format": "numpy",
+                    "order": "C"
+                },
+                {
+                    "format": "pandas",
+                    "order": "F"
+                }
+            ]
         }
     }
 }