Skip to content

Commit ec93df0

Browse files
committed
Update benchmarking scopes
1 parent 1103aad commit ec93df0

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

44 files changed

+1405
-534
lines changed

configs/common/dbscan.json

Lines changed: 27 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,27 @@
1+
{
2+
"PARAMETERS_SETS": {
3+
"common dbscan parameters": {
4+
"algorithm": {
5+
"estimator": "DBSCAN",
6+
"estimator_params": {
7+
"eps": "[SPECIAL_VALUE]distances_quantile:0.01",
8+
"min_samples": 5,
9+
"metric": "euclidean"
10+
}
11+
}
12+
},
13+
"sklearn dbscan parameters": {
14+
"algorithm": {
15+
"estimator_params": {
16+
"algorithm": "brute",
17+
"n_jobs": "[SPECIAL_VALUE]physical_cpus"
18+
}
19+
}
20+
},
21+
"cuml dbscan parameters": {
22+
"algorithm": {
23+
"estimator_params": { "calc_core_sample_indices": false, "verbose": 2 }
24+
}
25+
}
26+
}
27+
}

configs/common/ensemble.json

Lines changed: 64 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,64 @@
1+
{
2+
"PARAMETERS_SETS": {
3+
"common ensemble params": {
4+
"algorithm": {
5+
"estimator_params": {
6+
"n_estimators": 500,
7+
"max_depth": 12,
8+
"max_samples": 0.8,
9+
"min_samples_split": 5,
10+
"min_samples_leaf": 2,
11+
"min_impurity_decrease": 0.0,
12+
"bootstrap": true,
13+
"random_state": 42
14+
}
15+
}
16+
},
17+
"sklearn ensemble classifier params": {
18+
"algorithm": {
19+
"estimator": ["RandomForestClassifier", "ExtraTreesClassifier"],
20+
"estimator_params": {
21+
"criterion": "gini",
22+
"max_features": "sqrt",
23+
"max_leaf_nodes": null,
24+
"n_jobs": "[SPECIAL_VALUE]physical_cpus"
25+
}
26+
}
27+
},
28+
"sklearn ensemble regressor params": {
29+
"algorithm": {
30+
"estimator": ["RandomForestRegressor", "ExtraTreesRegressor"],
31+
"estimator_params": {
32+
"criterion": "squared_error",
33+
"max_features": 1.0,
34+
"max_leaf_nodes": null,
35+
"n_jobs": "[SPECIAL_VALUE]physical_cpus"
36+
}
37+
}
38+
},
39+
"cuml ensemble classifier params": {
40+
"algorithm": {
41+
"estimator": "RandomForestClassifier",
42+
"estimator_params": {
43+
"n_streams": 4,
44+
"split_criterion": "gini",
45+
"max_features": "sqrt",
46+
"max_leaves": -1,
47+
"n_bins": 256
48+
}
49+
}
50+
},
51+
"cuml ensemble regressor params": {
52+
"algorithm": {
53+
"estimator": "RandomForestRegressor",
54+
"estimator_params": {
55+
"n_streams": 4,
56+
"split_criterion": "mse",
57+
"max_features": 1.0,
58+
"max_leaves": -1,
59+
"n_bins": 256
60+
}
61+
}
62+
}
63+
}
64+
}

configs/common/kmeans.json

Lines changed: 25 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,25 @@
1+
{
2+
"PARAMETERS_SETS": {
3+
"common kmeans parameters": {
4+
"algorithm": {
5+
"estimator": "KMeans",
6+
"estimator_params": {
7+
"n_clusters": "[SPECIAL_VALUE]auto",
8+
"n_init": 1,
9+
"max_iter": 30,
10+
"tol": 1e-3,
11+
"random_state": 42
12+
},
13+
"estimator_methods": { "inference": "predict" }
14+
}
15+
},
16+
"sklearn kmeans parameters": {
17+
"algorithm": { "estimator_params": { "init": "k-means++", "algorithm": "lloyd" } }
18+
},
19+
"cuml kmeans parameters": {
20+
"algorithm": {
21+
"estimator_params": { "init": "scalable-k-means++" }
22+
}
23+
}
24+
}
25+
}

configs/common/knn.json

Lines changed: 42 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,42 @@
1+
{
2+
"PARAMETERS_SETS": {
3+
"common knn parameters": {
4+
"algorithm": {
5+
"estimator_params": {
6+
"n_neighbors": [10, 100],
7+
"weights": "uniform"
8+
}
9+
},
10+
"data": {
11+
"preprocessing_kwargs": { "normalize": true }
12+
}
13+
},
14+
"sklearn knn parameters": {
15+
"algorithm": { "estimator_params": { "n_jobs": "[SPECIAL_VALUE]physical_cpus" } }
16+
},
17+
"brute knn classification parameters": {
18+
"algorithm": {
19+
"estimator": "KNeighborsClassifier",
20+
"estimator_params": { "algorithm": "brute", "metric": "minkowski", "p": [1, 2] }
21+
}
22+
},
23+
"kd_tree knn classification parameters": {
24+
"algorithm": {
25+
"estimator": "KNeighborsClassifier",
26+
"estimator_params": { "algorithm": "kd_tree", "metric": "minkowski", "p": 2 }
27+
}
28+
},
29+
"brute knn regression parameters": {
30+
"algorithm": {
31+
"estimator": "KNeighborsRegressor",
32+
"estimator_params": { "algorithm": "brute", "metric": "minkowski", "p": [1, 2] }
33+
}
34+
},
35+
"kd_tree knn regression parameters": {
36+
"algorithm": {
37+
"estimator": "KNeighborsRegressor",
38+
"estimator_params": { "algorithm": "kd_tree", "metric": "minkowski", "p": 2 }
39+
}
40+
}
41+
}
42+
}

configs/common/lightgbm.json

Lines changed: 45 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,45 @@
1+
{
2+
"PARAMETERS_SETS": {
3+
"lightgbm implementations": [
4+
{
5+
"algorithm": {
6+
"device": "cpu",
7+
"estimator_params": {
8+
"boosting_type": "gbdt",
9+
"verbosity": -1,
10+
"n_jobs": "[SPECIAL_VALUE]physical_cpus"
11+
},
12+
"enable_modelbuilders": false
13+
}
14+
}
15+
],
16+
"lightgbm binary classification": {
17+
"algorithm": {
18+
"library": "lightgbm",
19+
"estimator": "LGBMClassifier",
20+
"estimator_params": {
21+
"objective": "binary"
22+
}
23+
}
24+
},
25+
"lightgbm multi classification": {
26+
"algorithm": {
27+
"library": "lightgbm",
28+
"estimator": "LGBMClassifier",
29+
"estimator_params": {
30+
"objective": "multiclass",
31+
"num_classes": "[SPECIAL_VALUE]auto"
32+
}
33+
}
34+
},
35+
"lightgbm regression": {
36+
"algorithm": {
37+
"library": "lightgbm",
38+
"estimator": "LGBMRegressor",
39+
"estimator_params": {
40+
"objective": "regression"
41+
}
42+
}
43+
}
44+
}
45+
}

configs/common/linear_model.json

Lines changed: 56 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,56 @@
1+
{
2+
"PARAMETERS_SETS": {
3+
"common linear parameters": {
4+
"algorithm": {
5+
"estimator": "LinearRegression",
6+
"estimator_params": { "fit_intercept": true, "copy_X": true }
7+
}
8+
},
9+
"common ridge parameters": {
10+
"algorithm": {
11+
"estimator": "Ridge",
12+
"estimator_params": {
13+
"fit_intercept": true,
14+
"alpha": 2.0
15+
}
16+
}
17+
},
18+
"common lasso parameters": {
19+
"algorithm": {
20+
"estimator": "Lasso",
21+
"estimator_params": {
22+
"fit_intercept": true,
23+
"max_iter": 1000,
24+
"selection": "cyclic",
25+
"alpha": 1e-3,
26+
"tol": 1e-6
27+
}
28+
}
29+
},
30+
"common elasticnet parameters": {
31+
"algorithm": {
32+
"estimator": "ElasticNet",
33+
"estimator_params": {
34+
"fit_intercept": true,
35+
"max_iter": 1000,
36+
"selection": "cyclic",
37+
"alpha": 1e-3,
38+
"l1_ratio": 0.9,
39+
"tol": 1e-6
40+
}
41+
}
42+
},
43+
"sklearn linear parameters": {
44+
"algorithm": { "estimator_params": { "n_jobs": "[SPECIAL_VALUE]physical_cpus" } }
45+
},
46+
"sklearn ridge parameters": {
47+
"algorithm": { "estimator_params": { "solver": "auto", "tol": 1e-4 } }
48+
},
49+
"cuml L2 parameters": {
50+
"algorithm": { "estimator_params": { "solver": "eig" } }
51+
},
52+
"cuml L1 parameters": {
53+
"algorithm": { "estimator_params": { "solver": "cd" } }
54+
}
55+
}
56+
}

configs/common/logreg.json

Lines changed: 29 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,29 @@
1+
{
2+
"INCLUDE": ["../common/sklearn.json"],
3+
"PARAMETERS_SETS": {
4+
"common logreg parameters": {
5+
"algorithm": {
6+
"estimator": "LogisticRegression",
7+
"estimator_methods": { "inference": "predict" },
8+
"estimator_params": {
9+
"penalty": "l2",
10+
"tol": 1e-4,
11+
"C": 1.0,
12+
"l1_ratio": null,
13+
"max_iter": 200
14+
}
15+
}
16+
},
17+
"sklearn logreg parameters": {
18+
"algorithm": {
19+
"estimator_params": {
20+
"solver": "lbfgs",
21+
"random_state": 42
22+
}
23+
}
24+
},
25+
"cuml logreg parameters": {
26+
"algorithm": { "estimator_params": { "solver": "qn" } }
27+
}
28+
}
29+
}

configs/common/pca.json

Lines changed: 27 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,27 @@
1+
{
2+
"INCLUDE": ["../common/sklearn.json"],
3+
"PARAMETERS_SETS": {
4+
"pca parameters": {
5+
"algorithm": {
6+
"estimator": "PCA",
7+
"estimator_params": {
8+
"n_components": 3,
9+
"copy": true,
10+
"whiten": false,
11+
"svd_solver": "covariance_eigh",
12+
"tol": 0.0,
13+
"iterated_power": 15,
14+
"random_state": 42
15+
}
16+
}
17+
},
18+
"cuml pca parameters": {
19+
"algorithm": {
20+
"estimator_params": {
21+
"svd_solver": "full",
22+
"random_state": "[REMOVE]"
23+
}
24+
}
25+
}
26+
}
27+
}

configs/common/sklearn.json

Lines changed: 13 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -12,13 +12,6 @@
1212
{ "library": "sklearnex", "device": ["cpu", "gpu"] }
1313
]
1414
},
15-
"sklearn-ex[preview] implementations": {
16-
"algorithm": [
17-
{ "library": "sklearn", "device": "cpu" },
18-
{ "library": "sklearnex", "device": "cpu" },
19-
{ "library": "sklearnex.preview", "device": ["cpu", "gpu"] }
20-
]
21-
},
2215
"sklearnex spmd implementation": {
2316
"algorithm": {
2417
"library": "sklearnex.spmd",
@@ -50,7 +43,19 @@
5043
},
5144
"cuml implementation": {
5245
"algorithm": { "library": "cuml" },
53-
"data": { "format": "cudf" }
46+
"data": { "format": "cupy" }
47+
},
48+
"extended data formats": {
49+
"data": [
50+
{
51+
"format": "numpy",
52+
"order": "C"
53+
},
54+
{
55+
"format": "pandas",
56+
"order": "F"
57+
}
58+
]
5459
}
5560
}
5661
}

0 commit comments

Comments
 (0)