Source code for lale.lib.autogen.pca


from sklearn.decomposition.pca import PCA as SKLModel
import lale.helpers
import lale.operators
from numpy import nan, inf

[docs]class PCAImpl(): def __init__(self, n_components=None, copy=True, whiten=False, svd_solver='auto', tol=0.0, iterated_power='auto', random_state=None): self._hyperparams = { 'n_components': n_components, 'copy': copy, 'whiten': whiten, 'svd_solver': svd_solver, 'tol': tol, 'iterated_power': iterated_power, 'random_state': random_state}
[docs] def fit(self, X, y=None): self._sklearn_model = SKLModel(**self._hyperparams) if (y is not None): self._sklearn_model.fit(X, y) else: self._sklearn_model.fit(X) return self
[docs] def transform(self, X): return self._sklearn_model.transform(X)
_hyperparams_schema = { '$schema': 'http://json-schema.org/draft-04/schema#', 'description': 'inherited docstring for PCA Principal component analysis (PCA)', 'allOf': [{ 'type': 'object', 'required': ['n_components', 'copy', 'whiten', 'svd_solver', 'tol', 'iterated_power', 'random_state'], 'relevantToOptimizer': ['n_components', 'copy', 'whiten', 'svd_solver', 'tol', 'iterated_power'], 'additionalProperties': False, 'properties': { 'n_components': { 'anyOf': [{ 'type': 'integer', 'forOptimizer': False}, { 'type': 'number', 'minimumForOptimizer': 0.0, 'maximumForOptimizer': 1.0, 'distribution': 'uniform'}, { 'type': 'string', 'forOptimizer': False}, { 'enum': [None]}], 'default': None, 'description': 'Number of components to keep.'}, 'copy': { 'type': 'boolean', 'default': True, 'description': 'If False, data passed to fit are overwritten and running'}, 'whiten': { 'type': 'boolean', 'default': False, 'description': 'When True (False by default) the `components_` vectors are multiplied'}, 'svd_solver': { 'enum': ['arpack', 'auto', 'full', 'randomized'], 'default': 'auto', 'description': 'auto :'}, 'tol': { 'XXX TODO XXX': 'float >= 0, optional (default .0)', 'description': "Tolerance for singular values computed by svd_solver == 'arpack'.", 'type': 'number', 'minimumForOptimizer': 1e-08, 'maximumForOptimizer': 0.01, 'distribution': 'loguniform', 'default': 0.0}, 'iterated_power': { 'XXX TODO XXX': "int >= 0, or 'auto', (default 'auto')", 'description': 'Number of iterations for the power method computed by', 'anyOf': [{ 'type': 'integer', 'minimumForOptimizer': 3, 'maximumForOptimizer': 4, 'distribution': 'uniform'}, { 'enum': ['auto']}], 'default': 'auto'}, 'random_state': { 'anyOf': [{ 'type': 'integer'}, { 'type': 'object'}, { 'enum': [None]}], 'default': None, 'description': 'If int, random_state is the seed used by the random number generator;'}, }}], } _input_fit_schema = { '$schema': 'http://json-schema.org/draft-04/schema#', 'description': 'Fit the model with X.', 'type': 'object', 'properties': { 'X': { 'type': 'array', 'items': { 'type': 'array', 'items': { 'type': 'number'}, }, 'description': 'Training data, where n_samples is the number of samples'}, 'y': { }}, } _input_transform_schema = { '$schema': 'http://json-schema.org/draft-04/schema#', 'description': 'Apply dimensionality reduction to X.', 'type': 'object', 'properties': { 'X': { 'type': 'array', 'items': { 'type': 'array', 'items': { 'type': 'number'}, }, 'description': 'New data, where n_samples is the number of samples'}, }, } _output_transform_schema = { '$schema': 'http://json-schema.org/draft-04/schema#', 'description': 'Apply dimensionality reduction to X.', 'type': 'array', 'items': { 'type': 'array', 'items': { 'type': 'number'}, }, } _combined_schemas = { '$schema': 'http://json-schema.org/draft-04/schema#', 'description': 'Combined schema for expected data and hyperparameters.', 'type': 'object', 'tags': { 'pre': [], 'op': ['transformer'], 'post': []}, 'properties': { 'hyperparams': _hyperparams_schema, 'input_fit': _input_fit_schema, 'input_transform': _input_transform_schema, 'output_transform': _output_transform_schema}, } if (__name__ == '__main__'): lale.helpers.validate_is_schema(_combined_schemas) PCA = lale.operators.make_operator(PCAImpl, _combined_schemas)