@@ -11,11 +11,10 @@ scale across a set of classifiers and metrics. It will also use Pydra's caching
1111to not redo model training and evaluation when new metrics are added, or when the
1212number of iterations (`n_splits`) is increased.
1313
14- Upcoming features:
15- 1. Improve output report containing [SHAP](https://github.com/slundberg/shap)
14+ 1. Output report contains [SHAP](https://github.com/slundberg/shap)
1615 feature analysis.
17- 2 . Allow for comparing scikit-learn pipelines.
18- 3 . Test on scikit-learn compatible classifiers
16+ 2. Allows for comparing *some* scikit-learn pipelines in addition to base
17+ classifiers.
1918
2019### Installation
2120
@@ -109,6 +108,16 @@ This is a list of classifiers from scikit learn and uses an array to encode:
109108when a param grid is provided and the default classifier parameters are not changed,
110109then an empty dictionary **MUST** be provided as parameter 3.
111110
111+ An entry can also be a nested list of these arrays, which specifies a scikit-learn Pipeline. For
112+ example:
113+
114+ ```
115+ [ ["sklearn.impute", "SimpleImputer"],
116+ ["sklearn.preprocessing", "StandardScaler"],
117+ ["sklearn.tree", "DecisionTreeClassifier", {"max_depth": 5}]
118+ ]
119+ ```
120+
112121## Example specification:
113122
114123```
@@ -121,17 +130,17 @@ then an empty dictionary **MUST** be provided as parameter 3.
121130 "test_size": 0.2,
122131 "clf_info": [
123132 ["sklearn.ensemble", "AdaBoostClassifier"],
124- ["sklearn.naive_bayes", "GaussianNB"],
125133 ["sklearn.tree", "DecisionTreeClassifier", {"max_depth": 5}],
126- ["sklearn.ensemble", "RandomForestClassifier", {"n_estimators": 100}],
127- ["sklearn.ensemble", "ExtraTreesClassifier", {"n_estimators": 100, "class_weight": "balanced"}],
128- ["sklearn.linear_model", "LogisticRegressionCV", {"solver": "liblinear", "penalty": "l1"}],
129134 ["sklearn.neural_network", "MLPClassifier", {"alpha": 1, "max_iter": 1000}],
130135 ["sklearn.svm", "SVC", {"probability": true},
131136 [{"kernel": ["rbf", "linear"], "C": [1, 10, 100, 1000]}]],
132137 ["sklearn.neighbors", "KNeighborsClassifier", {},
133138 [{"n_neighbors": [3, 5, 7, 9, 11, 13, 15, 17, 19],
134- "weights": ["uniform", "distance"]}]]
139+ "weights": ["uniform", "distance"]}]],
140+ [ ["sklearn.impute", "SimpleImputer"],
141+ ["sklearn.preprocessing", "StandardScaler"],
142+ ["sklearn.tree", "DecisionTreeClassifier", {"max_depth": 5}]
143+ ]
135144 ],
136145 "permute": [true, false],
137146 "gen_shap": true,
0 commit comments