Quick-fix (#539)

* fix doc string; enable label transform in automl.score
This commit is contained in:
Qiaochu Song
2022-05-19 11:43:34 -04:00
committed by GitHub
parent 7126b69ce0
commit 2851134052
3 changed files with 60 additions and 4 deletions

View File

@@ -848,6 +848,8 @@ class AutoML(BaseEstimator):
)
return None
X = self._preprocess(X)
if self._label_transformer:
y = self._label_transformer.transform(y)
return estimator.score(X, y, **kwargs)
def predict(

View File

@@ -384,13 +384,9 @@ class DataTransformer:
Args:
X: A numpy array or a pandas dataframe of training data.
y: A numpy array or a pandas series of labels.
task: A string of the task type, e.g.,
'classification', 'regression', 'ts_forecast', 'rank'.
Returns:
X: Processed numpy array or pandas dataframe of training data.
y: Processed numpy array or pandas series of labels.
"""
X = X.copy()

View File

@@ -212,6 +212,64 @@ class TestScore:
except NotImplementedError:
pass
def test_class(self):
# to test classification task with labels need encoding
X = pd.DataFrame(
{
"f1": [1, -2, 3, -4, 5, -6, -7, 8, -9, -10, -11, -12, -13, -14],
"f2": [
3.0,
16.0,
10.0,
12.0,
3.0,
14.0,
11.0,
12.0,
5.0,
14.0,
20.0,
16.0,
15.0,
11.0,
],
}
)
y = pd.Series(
[
"a",
"b",
"c",
"d",
"a",
"b",
"c",
"d",
"a",
"b",
"c",
"d",
"a",
"b",
]
)
automl = AutoML()
automl_settings = {
"time_budget": 6,
"task": "classification",
"n_jobs": 1,
"estimator_list": ["xgboost"],
"metric": "accuracy",
"log_training_metric": True,
}
automl.fit(X, y, **automl_settings)
assert automl._label_transformer is not None
assert automl.score(X, y) > 0
automl.pickle("automl.pkl")
if __name__ == "__main__":
test = TestScore()