In [49]:
from test.data.datasets import get_dataset
from fedot.api.main import Fedot
import numpy as np
import pandas as pd
import string
from fedot.core.pipelines.pipeline_builder import PipelineBuilder

import cProfile
import pstats
from pstats import SortKey

from sklearn.datasets import make_regression
from sklearn.model_selection import train_test_split

# One seed for every stochastic step in this cell, so that
# "Restart Kernel -> Run All" regenerates the same data and the same search.
SEED = 42

# 10x10 frame of integers drawn from [0, 100), columns named "a".."j".
# A dedicated seeded generator is used instead of the global NumPy RNG state.
df = pd.DataFrame(
    np.random.default_rng(SEED).integers(0, 100, size=(10, 10)),
    columns=list(string.ascii_lowercase[:10]),
)

# Synthetic single-feature regression problem and its train/test split.
# random_state is passed to both calls so the sample and the split are repeatable.
X, y = make_regression(n_samples=100, n_features=1, noise=1, random_state=SEED)
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.33, random_state=SEED)

task_type = "regression"

# Data handed to FEDOT comes from the project's test helper; the third
# returned value is not used here.
# NOTE(review): `df` and the X/y split above are not referenced in this cell --
# confirm whether later cells still need them.
train_data, test_data, _ = get_dataset(task_type)

# Starting point for the search: a "scaling" node followed by a "linear" node.
initial_pipeline = (
    PipelineBuilder()
    .add_node("scaling")
    .add_node("linear")
    .build()
)

auto_model = Fedot(
    problem=task_type,
    metric=["rmse"],
    preset="best_quality",
    with_tuning=False,
    timeout=3,  # time limit for the search, in minutes
    cv_folds=5,
    seed=SEED,
    n_jobs=1,
    initial_assumption=initial_pipeline,
    # logging_level=10,
    use_pipelines_cache=False,
    use_auto_preprocessing=False,
)


In [50]:
# Run the pipeline search / fit on the training data.
auto_model.fit(features=train_data)

# Predict on the held-out data; save_predictions=False is passed explicitly.
prediction = auto_model.predict(
    features=test_data,
    save_predictions=False,
)

2024-12-10 21:20:24,693 - ApiComposer - Initial pipeline was fitted in 0.3 sec.
2024-12-10 21:20:24,699 - ApiComposer - Taking into account n_folds=5, estimated fit time for initial assumption is 1.6 sec.
2024-12-10 21:20:24,722 - ApiComposer - AutoML configured. Parameters tuning: False. Time limit: 3 min. Set of candidate models: ['adareg', 'catboostreg', 'dtreg', 'fast_ica', 'isolation_forest_reg', 'knnreg', 'lasso', 'lgbmreg', 'linear', 'normalization', 'pca', 'poly_features', 'ransac_lin_reg', 'ransac_non_lin_reg', 'rfr', 'ridge', 'scaling', 'sgdr', 'svr', 'xgboostreg'].
2024-12-10 21:20:24,803 - ApiComposer - Pipeline composition started.


Generations:   0%|          | 0/10000 [00:00<?, ?gen/s]

2024-12-10 21:20:25,042 - PipelineNode - -- save fit node data_cache
2024-12-10 21:20:25,200 - PipelineObjectiveEvaluate - --- save evaluate metrics cache
2024-12-10 21:20:25,491 - PipelineNode - -- save fit node data_cache
2024-12-10 21:20:25,858 - PipelineObjectiveEvaluate - --- save evaluate metrics cache
2024-12-10 21:20:26,174 - PipelineNode - -- save fit node data_cache
2024-12-10 21:20:26,319 - PipelineObjectiveEvaluate - --- save evaluate metrics cache
2024-12-10 21:20:26,629 - PipelineNode - -- save fit node data_cache
2024-12-10 21:20:26,787 - PipelineObjectiveEvaluate - --- save evaluate metrics cache
2024-12-10 21:20:27,077 - PipelineNode - -- save fit node data_cache
2024-12-10 21:20:27,223 - PipelineObjectiveEvaluate - --- save evaluate metrics cache
2024-12-10 21:20:27,722 - MultiprocessingDispatcher - 1 individuals out of 1 in previous population were evaluated successfully.
2024-12-10 21:20:32,576 - PipelineNode - -- save fit node data_cache
2024-12-10 21:20:32,736 - P

Generations:   0%|          | 0/10000 [02:25<?, ?gen/s]


2024-12-10 21:22:50,764 - ApiComposer - Model generation finished
2024-12-10 21:22:53,511 - FEDOT logger - Final pipeline was fitted
2024-12-10 21:22:53,517 - FEDOT logger - Final pipeline: {'depth': 2, 'length': 2, 'nodes': [linear, isolation_forest_reg]}
linear - {}
isolation_forest_reg - {}


In [None]:
# NOTE(review): this cell repeats the fit/predict of the previous cell on the
# same `auto_model`, and its stored output carries the same timestamps as the
# earlier run -- confirm the repeat is intentional (e.g. a second run for
# comparison) and re-execute so the output is fresh.
auto_model.fit(features=train_data)

# Overwrites `prediction` from the previous cell with the new run's result.
prediction = auto_model.predict(
    features=test_data,
    save_predictions=False,
)

2024-12-10 21:20:24,693 - ApiComposer - Initial pipeline was fitted in 0.3 sec.
2024-12-10 21:20:24,699 - ApiComposer - Taking into account n_folds=5, estimated fit time for initial assumption is 1.6 sec.
2024-12-10 21:20:24,722 - ApiComposer - AutoML configured. Parameters tuning: False. Time limit: 3 min. Set of candidate models: ['adareg', 'catboostreg', 'dtreg', 'fast_ica', 'isolation_forest_reg', 'knnreg', 'lasso', 'lgbmreg', 'linear', 'normalization', 'pca', 'poly_features', 'ransac_lin_reg', 'ransac_non_lin_reg', 'rfr', 'ridge', 'scaling', 'sgdr', 'svr', 'xgboostreg'].
2024-12-10 21:20:24,803 - ApiComposer - Pipeline composition started.


Generations:   0%|          | 0/10000 [00:00<?, ?gen/s]

2024-12-10 21:20:25,042 - PipelineNode - -- save fit node data_cache
2024-12-10 21:20:25,200 - PipelineObjectiveEvaluate - --- save evaluate metrics cache
2024-12-10 21:20:25,491 - PipelineNode - -- save fit node data_cache
2024-12-10 21:20:25,858 - PipelineObjectiveEvaluate - --- save evaluate metrics cache
2024-12-10 21:20:26,174 - PipelineNode - -- save fit node data_cache
2024-12-10 21:20:26,319 - PipelineObjectiveEvaluate - --- save evaluate metrics cache
2024-12-10 21:20:26,629 - PipelineNode - -- save fit node data_cache
2024-12-10 21:20:26,787 - PipelineObjectiveEvaluate - --- save evaluate metrics cache
2024-12-10 21:20:27,077 - PipelineNode - -- save fit node data_cache
2024-12-10 21:20:27,223 - PipelineObjectiveEvaluate - --- save evaluate metrics cache
2024-12-10 21:20:27,722 - MultiprocessingDispatcher - 1 individuals out of 1 in previous population were evaluated successfully.
2024-12-10 21:20:32,576 - PipelineNode - -- save fit node data_cache
2024-12-10 21:20:32,736 - P