68c9bab4a5c6821c2a4395763c676ba796406c49,dask_ml/preprocessing/_encoders.py,OneHotEncoder,_fit,#OneHotEncoder#Any#Any#,157
Before Change
self.categories_.append(cats)
self.dtypes_.append(None)
else :
if not (X.dtypes == "category" ) .all () :
raise ValueError ("All columns must be Categorical dtype." )
if self.categories == "auto" :
for col in X.columns:
Xi = X[col]
cats = _encode(Xi, uniques=Xi.cat.categories)
self.categories_.append(cats)
self.dtypes_.append(Xi.dtype)
else :
raise ValueError (
"Cannot specify " categories" with DataFrame input. "
"Use a categorical dtype instead."
)
self.categories_ = dask.compute(self.categories_)[0 ]
def transform (
After Change
self.dtypes_.append(None)
else :
for i in range (len(X.columns) ):
Xi = X.iloc[:, i]
if self.categories != "auto" :
categories = self.categories[i]
Xi = Xi.astype(pd.CategoricalDtype(categories))
else :
In pattern: SUPERPATTERN
Frequency: 3
Non-data size: 7
Instances Project Name: dask/dask-ml
Commit Name: 68c9bab4a5c6821c2a4395763c676ba796406c49
Time: 2020-08-17
Author: TomAugspurger@users.noreply.github.com
File Name: dask_ml/preprocessing/_encoders.py
Class Name: OneHotEncoder
Method Name: _fit
Project Name: dask/dask-ml
Commit Name: 68c9bab4a5c6821c2a4395763c676ba796406c49
Time: 2020-08-17
Author: TomAugspurger@users.noreply.github.com
File Name: dask_ml/preprocessing/_encoders.py
Class Name: OneHotEncoder
Method Name: _transform
Project Name: deepgram/kur
Commit Name: 1f1adbf4aa47514d0ce857398fa0d1cb2956e267
Time: 2017-01-03
Author: ajsyp@syptech.net
File Name: kur/providers/shuffle_provider.py
Class Name: ShuffleProvider
Method Name: __init__