in python/pipelines/components/python/component.py [0:0]
def _create_model(params):
    """Build an unfitted preprocessing + KMeans clustering pipeline.

    Columns are routed by dtype through a ``ColumnTransformer``:

    * non-``object`` columns: median imputation, then standard scaling;
    * ``object`` columns: most-frequent imputation, then dense one-hot
      encoding.

    The transformed features are fed to a ``KMeans`` estimator.

    Args:
        params: Mapping of keyword arguments forwarded to ``KMeans``
            (for example ``{"n_clusters": 8}``). ``None`` or an empty
            mapping uses only the defaults. Entries in ``params`` take
            precedence over the built-in defaults (``init``, ``n_init``,
            ``random_state``) instead of colliding with them.

    Returns:
        The unfitted ``Pipeline`` with steps ``'transform'`` and ``'model'``.
    """
    logging.info(f"Creating model with params: {params}")

    numeric_transformer = Pipeline(steps=[
        ('imputer', SimpleImputer(strategy='median')),
        ('scaler', StandardScaler()),
    ])

    # NOTE(review): OneHotEncoder is left at its default handling of unseen
    # categories; confirm whether categories absent at fit time can appear
    # at predict time and, if so, consider handle_unknown='ignore'.
    categorical_transformer = Pipeline(steps=[
        ('imputer', SimpleImputer(strategy='most_frequent')),
        ('onehot', OneHotEncoder(sparse_output=False)),
    ])

    # `selector` is presumably sklearn's make_column_selector (imported
    # elsewhere in this file); columns are split on object vs. non-object dtype.
    preprocessor = ColumnTransformer(
        transformers=[
            ('num', numeric_transformer, selector(dtype_exclude=object)),
            ('cat', categorical_transformer, selector(dtype_include=object)),
        ]
    )

    # Merge defaults with caller-supplied params. Passing both explicit
    # keywords and **params would raise TypeError ("multiple values for
    # keyword argument") whenever params repeated one of these keys.
    kmeans_kwargs = {
        'init': 'k-means++',
        'n_init': 'auto',
        'random_state': 42,
    }
    kmeans_kwargs.update(params or {})

    model = Pipeline([
        ('transform', preprocessor),
        ('model', KMeans(**kmeans_kwargs)),
    ])
    return model