Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

initial alignment of configs to final results #176

Merged
merged 12 commits into from
Mar 21, 2025
100 changes: 0 additions & 100 deletions configs/incremental.json

This file was deleted.

15 changes: 8 additions & 7 deletions configs/spmd/large_scale/basic_stats.json
Original file line number Diff line number Diff line change
Expand Up @@ -4,16 +4,17 @@
"spmd basicstats parameters": {
"algorithm": {
"estimator": "BasicStatistics",
"estimator_methods": { "training": "fit" }
"estimator_methods": { "training": "fit" },
"sklearnex_context": { "use_raw_input": true }
},
"data": {
"split_kwargs": { "test_size": 0.0001 }
}
"data": {
"split_kwargs": { "test_size": 0.0001 }
}
},
"synthetic data": {
"data": [
{ "source": "make_blobs", "generation_kwargs": { "n_samples": 10000000, "n_features": 10, "centers": 1 } },
{ "source": "make_blobs", "generation_kwargs": { "n_samples": 100000, "n_features": 1000, "centers": 1 } }
{ "source": "make_blobs", "generation_kwargs": { "n_samples": 100000000, "n_features": 10, "centers": 1 } },
{ "source": "make_blobs", "generation_kwargs": { "n_samples": 1000000, "n_features": 1000, "centers": 1 } }
]
}
},
Expand All @@ -22,7 +23,7 @@
"SETS": [
"sklearnex spmd implementation",
"large scale 2k parameters",
"synthetic data",
"synthetic data",
"spmd basicstats parameters"
]
}
Expand Down
13 changes: 7 additions & 6 deletions configs/spmd/large_scale/basic_stats_strong.json
Original file line number Diff line number Diff line change
Expand Up @@ -4,11 +4,12 @@
"spmd basicstats parameters": {
"algorithm": {
"estimator": "BasicStatistics",
"estimator_methods": { "training": "fit" }
"estimator_methods": { "training": "fit" },
"sklearnex_context": { "use_raw_input": true }
},
"data": {
"split_kwargs": { "test_size": 0.0001 }
}
"data": {
"split_kwargs": { "test_size": 0.0001 }
}
},
"synthetic data": {
"data": [
Expand All @@ -20,8 +21,8 @@
"basicstats": {
"SETS": [
"sklearnex spmd implementation",
"large scale strong 2k parameters",
"synthetic data",
"large scale strong <=64 parameters",
"synthetic data",
"spmd basicstats parameters"
]
}
Expand Down
9 changes: 5 additions & 4 deletions configs/spmd/large_scale/covariance.json
Original file line number Diff line number Diff line change
Expand Up @@ -4,16 +4,17 @@
"spmd basicstats parameters": {
"algorithm": {
"estimator": "EmpiricalCovariance",
"estimator_methods": { "training": "fit" }
"estimator_methods": { "training": "fit" },
"sklearnex_context": { "use_raw_input": true }
},
"data": {
"split_kwargs": { "test_size": 0.0001 }
}
},
"synthetic data": {
"data": [
{ "source": "make_blobs", "generation_kwargs": { "n_samples": 10000000, "n_features": 10, "centers": 1 } },
{ "source": "make_blobs", "generation_kwargs": { "n_samples": 100000, "n_features": 1000, "centers": 1 } }
{ "source": "make_blobs", "generation_kwargs": { "n_samples": 100000000, "n_features": 10, "centers": 1 } },
{ "source": "make_blobs", "generation_kwargs": { "n_samples": 1000000, "n_features": 1000, "centers": 1 } }
]
}
},
Expand All @@ -22,7 +23,7 @@
"SETS": [
"sklearnex spmd implementation",
"large scale 2k parameters",
"synthetic data",
"synthetic data",
"spmd basicstats parameters"
]
}
Expand Down
7 changes: 4 additions & 3 deletions configs/spmd/large_scale/covariance_strong.json
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,8 @@
"spmd basicstats parameters": {
"algorithm": {
"estimator": "EmpiricalCovariance",
"estimator_methods": { "training": "fit" }
"estimator_methods": { "training": "fit" },
"sklearnex_context": { "use_raw_input": true }
},
"data": {
"split_kwargs": { "test_size": 0.0001 }
Expand All @@ -20,8 +21,8 @@
"covariance": {
"SETS": [
"sklearnex spmd implementation",
"large scale strong 2k parameters",
"synthetic data",
"large scale strong <=64 parameters",
"synthetic data",
"spmd basicstats parameters"
]
}
Expand Down
5 changes: 3 additions & 2 deletions configs/spmd/large_scale/dbscan.json
Original file line number Diff line number Diff line change
Expand Up @@ -9,15 +9,16 @@
},
"estimator_params" : {
"eps": 10, "min_samples": 5
}
},
"sklearnex_context": { "use_raw_input": true }
},
"data": {
"dtype": "float64"
}
},
"synthetic dataset": {
"data": [
{ "source": "make_blobs", "generation_kwargs": { "n_samples": 100000, "n_features": 100, "centers": 10 } }
{ "source": "make_blobs", "generation_kwargs": { "n_samples": 40000, "n_features": 100, "centers": 10 } }
]
}
},
Expand Down
15 changes: 8 additions & 7 deletions configs/spmd/large_scale/dbscan_strong.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,21 +3,22 @@
"PARAMETERS_SETS": {
"spmd dbscan parameters": {
"algorithm": {
"estimator": "DBSCAN",
"estimator_methods": {
"training": "fit"
"estimator": "DBSCAN",
"estimator_methods": {
"training": "fit"
},
"estimator_params" : {
"eps": 10, "min_samples": 5
}
"eps": 15, "min_samples": 50
},
"sklearnex_context": { "use_raw_input": true }
},
"data": {
"dtype": "float64"
}
},
"synthetic dataset": {
"data": [
{ "source": "make_blobs", "generation_kwargs": { "n_samples": 500000, "n_features": 100, "centers": 10 } }
{ "source": "make_blobs", "generation_kwargs": { "n_samples": 4000000, "n_features": 100, "centers": 10 } }
]
}
},
Expand All @@ -27,7 +28,7 @@
"common dbscan parameters",
"synthetic dataset",
"sklearnex spmd implementation",
"large scale strong <=64 parameters",
"large scale strong <=64 parameters",
"spmd dbscan parameters"
]
}
Expand Down
28 changes: 28 additions & 0 deletions configs/spmd/large_scale/forest_max_samples.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,28 @@
{
    "INCLUDE": ["../../common/sklearn.json", "large_scale.json"],
    "PARAMETERS_SETS": {
        "spmd forest classification parameters": {
            "algorithm": {
                "estimator": "RandomForestClassifier",
                "estimator_methods": { "training": "fit" },
                "estimator_params": { "n_estimators": 20, "max_depth": 10 },
                "sklearnex_context": { "use_raw_input": true }
            }
        },
        "synthetic data": {
            "data": [
                { "source": "make_classification", "split_kwargs": { "train_size": 1000000, "test_size": 1000 }, "generation_kwargs": { "n_samples": 1001000, "n_features": 100, "n_classes": 2 } }
            ]
        }
    },
    "TEMPLATES": {
        "forestCls": {
            "SETS": [
                "sklearnex spmd implementation",
                "large scale 32 parameters",
                "synthetic data",
                "spmd forest classification parameters"
            ]
        }
    }
}
Original file line number Diff line number Diff line change
Expand Up @@ -4,14 +4,13 @@
"spmd forest classification parameters": {
"algorithm": {
"estimator": "RandomForestClassifier",
"estimator_methods": { "training": "fit" },
"estimator_params": { "n_estimators": 20, "max_depth": 4 }
"estimator_params": { "n_estimators": 100, "max_depth": 7 },
"sklearnex_context": { "use_raw_input": true }
}
},
"synthetic data": {
"data": [
{ "source": "make_classification", "split_kwargs": { "train_size": 500000, "test_size": 1000 }, "generation_kwargs": { "n_samples": 501000, "n_features": 10, "n_classes": 2 } },
{ "source": "make_classification", "split_kwargs": { "train_size": 10000, "test_size": 1000 }, "generation_kwargs": { "n_samples": 11000, "n_features": 1000, "n_classes": 2 } }
{ "source": "make_classification", "split_kwargs": { "train_size": 1000000, "test_size": 1000 }, "generation_kwargs": { "n_samples": 1001000, "n_features": 100, "n_classes": 2, "n_informative": "[SPECIAL_VALUE]0.5" } }
]
}
},
Expand All @@ -20,7 +19,7 @@
"SETS": [
"sklearnex spmd implementation",
"large scale 2k parameters",
"synthetic data",
"synthetic data",
"spmd forest classification parameters"
]
}
Expand Down
11 changes: 6 additions & 5 deletions configs/spmd/large_scale/forest_strong.json
Original file line number Diff line number Diff line change
Expand Up @@ -4,22 +4,23 @@
"spmd forest classification parameters": {
"algorithm": {
"estimator": "RandomForestClassifier",
"estimator_methods": { "training": "fit" },
"estimator_params": { "n_estimators": 20, "max_depth": 4 }
"estimator_methods": { "training": "fit" },
"estimator_params": { "n_estimators": 100, "max_depth": 8 },
"sklearnex_context": {"use_raw_input": true}
}
},
"synthetic data": {
"data": [
{ "source": "make_classification", "split_kwargs": { "train_size": 10000000, "test_size": 1000 }, "generation_kwargs": { "n_samples": 10001000, "n_features": 100, "n_classes": 2 } }
{ "source": "make_classification", "split_kwargs": { "train_size": 20000, "test_size": 1000 }, "generation_kwargs": { "n_samples": 21000, "n_features": 200, "n_classes": 2 } }
]
}
},
"TEMPLATES": {
"forestCls": {
"SETS": [
"sklearnex spmd implementation",
"large scale strong 2k parameters",
"synthetic data",
"large scale strong <=64 parameters",
"synthetic data",
"spmd forest classification parameters"
]
}
Expand Down
Loading
Loading