freqtrade_origin/freqtrade/freqai/prediction_models/CatboostRegressorMultiTarget.py

import logging
from pathlib import Path
from typing import Any

from catboost import CatBoostRegressor, Pool

from freqtrade.freqai.base_models.BaseRegressionModel import BaseRegressionModel
from freqtrade.freqai.base_models.FreqaiMultiOutputRegressor import FreqaiMultiOutputRegressor
from freqtrade.freqai.data_kitchen import FreqaiDataKitchen


logger = logging.getLogger(__name__)


class CatboostRegressorMultiTarget(BaseRegressionModel):
    """
    CatBoost regression model for several label columns at once.

    A single `CatBoostRegressor` template is wrapped in a
    `FreqaiMultiOutputRegressor`, and one set of fit parameters (evaluation
    set and initial model) is prepared per label column. Users can subclass
    this and override `fit()` to customise training beyond what the top
    level config.json file exposes.
    """

    def fit(self, data_dictionary: dict, dk: FreqaiDataKitchen, **kwargs) -> Any:
        """
        Build and train the multi-target model from the prepared data.

        :param data_dictionary: dictionary read for the keys `train_features`,
            `train_labels`, `train_weights` and, when a test split is in use,
            `test_features`, `test_labels` and `test_weights`
        :param dk: The datakitchen object for the current coin/model; its
            `data_path` is used as the CatBoost `train_dir` and its `pair` is
            used to look up an initial model
        :return: the fitted `FreqaiMultiOutputRegressor`
        """
        # Template estimator handed to the multi-output wrapper.
        base_estimator = CatBoostRegressor(
            allow_writing_files=True,
            train_dir=Path(dk.data_path),
            **self.model_training_parameters,
        )

        features = data_dictionary["train_features"]
        labels = data_dictionary["train_labels"]
        weights = data_dictionary["train_weights"]
        n_targets = labels.shape[1]

        # A test_size of 0 means no held-out data, so no evaluation sets are
        # built; when the key is missing the split defaults to 0.1.
        split_params = self.freqai_info.get("data_split_parameters", {})
        if split_params.get("test_size", 0.1) != 0:
            eval_sets = [
                Pool(
                    data=data_dictionary["test_features"],
                    label=data_dictionary["test_labels"].iloc[:, column],
                    weight=data_dictionary["test_weights"],
                )
                for column in range(data_dictionary["test_labels"].shape[1])
            ]
        else:
            eval_sets = [None] * n_targets

        # Presumably the previously trained model for this pair (continual
        # learning); a falsy result means every target starts from scratch.
        previous_model = self.get_init_model(dk.pair)
        init_models = previous_model.estimators_ if previous_model else [None] * n_targets

        # One fit-parameter dict per evaluation set, matched by position with
        # the corresponding initial model.
        fit_params = [
            {
                "eval_set": eval_set,
                "init_model": init_models[idx],
            }
            for idx, eval_set in enumerate(eval_sets)
        ]

        model = FreqaiMultiOutputRegressor(estimator=base_estimator)
        # Opt-in parallel training: one job per label column.
        if self.freqai_info.get("multitarget_parallel_training", False):
            model.n_jobs = n_targets
        model.fit(X=features, y=labels, sample_weight=weights, fit_params=fit_params)

        return model
Rehaul organization of return values 2022-07-02 16:09:38 +00:00			`import logging`
isolate and standardize location of tensorboard files, add doc, ensure backtesting functionality 2022-10-09 19:11:37 +00:00			`from pathlib import Path`
chore: update freqai to modern typing syntax 2024-10-04 04:50:31 +00:00			`from typing import Any`
Rehaul organization of return values 2022-07-02 16:09:38 +00:00
enable continual learning and evaluation sets on multioutput models. 2022-09-10 14:54:13 +00:00			`from catboost import CatBoostRegressor, Pool`
add kwargs, reduce duplicated code 2022-09-07 16:58:55 +00:00
enable continual learning and evaluation sets on multioutput models. 2022-09-10 14:54:13 +00:00			`from freqtrade.freqai.base_models.BaseRegressionModel import BaseRegressionModel`
			`from freqtrade.freqai.base_models.FreqaiMultiOutputRegressor import FreqaiMultiOutputRegressor`
add continual learning to catboost and friends 2022-09-06 18:30:37 +00:00			`from freqtrade.freqai.data_kitchen import FreqaiDataKitchen`
Rehaul organization of return values 2022-07-02 16:09:38 +00:00

			`logger = logging.getLogger(__name__)`


add classifier, improve model naming scheme 2022-07-09 08:13:33 +00:00			`class CatboostRegressorMultiTarget(BaseRegressionModel):`
Rehaul organization of return values 2022-07-02 16:09:38 +00:00			`"""`
fix model loading from disk bug, improve doc, clarify installation/docker instructions, add a torch tag to the freqairl docker image. Fix seriously outdated prediction_model docstrings 2023-04-08 10:09:53 +00:00			`User created prediction model. The class inherits IFreqaiModel, which`
			`means it has full access to all Frequency AI functionality. Typically,`
			users would use this to override the common `fit()`, `train()`, or
			`predict()` methods to add their custom data handling tools or change
			`various aspects of the training that cannot be configured via the`
			`top level config.json file.`
Rehaul organization of return values 2022-07-02 16:09:38 +00:00			`"""`

chore: update freqai to modern typing syntax 2024-10-04 04:50:31 +00:00			`def fit(self, data_dictionary: dict, dk: FreqaiDataKitchen, **kwargs) -> Any:`
Rehaul organization of return values 2022-07-02 16:09:38 +00:00			`"""`
			`User sets up the training and test data to fit their desired model here`
fix model loading from disk bug, improve doc, clarify installation/docker instructions, add a torch tag to the freqairl docker image. Fix seriously outdated prediction_model docstrings 2023-04-08 10:09:53 +00:00			`:param data_dictionary: the dictionary holding all data for train, test,`
			`labels, weights`
			`:param dk: The datakitchen object for the current coin/model`
Rehaul organization of return values 2022-07-02 16:09:38 +00:00			`"""`

			`cbr = CatBoostRegressor(`
Add сatboost train_dir for tensorboard 2022-10-06 16:59:35 +00:00			`allow_writing_files=True,`
remove tensorboard dir from other pred models 2022-10-11 17:49:24 +00:00			`train_dir=Path(dk.data_path),`
black formatting on freqai files 2022-07-03 08:59:38 +00:00			`**self.model_training_parameters,`
Rehaul organization of return values 2022-07-02 16:09:38 +00:00			`)`

			`X = data_dictionary["train_features"]`
			`y = data_dictionary["train_labels"]`

enable continual learning and evaluation sets on multioutput models. 2022-09-10 14:54:13 +00:00			`sample_weight = data_dictionary["train_weights"]`
add continual learning to catboost and friends 2022-09-06 18:30:37 +00:00
enable continual learning and evaluation sets on multioutput models. 2022-09-10 14:54:13 +00:00			`eval_sets = [None] * y.shape[1]`
allow user to pass test_size = 0 and avoid using eval sets in prediction models 2022-07-25 17:40:13 +00:00
ruff format: freqai 2024-05-12 15:12:20 +00:00			`if self.freqai_info.get("data_split_parameters", {}).get("test_size", 0.1) != 0:`
			`eval_sets = [None] * data_dictionary["test_labels"].shape[1]`
enable continual learning and evaluation sets on multioutput models. 2022-09-10 14:54:13 +00:00
ruff format: freqai 2024-05-12 15:12:20 +00:00			`for i in range(data_dictionary["test_labels"].shape[1]):`
enable continual learning and evaluation sets on multioutput models. 2022-09-10 14:54:13 +00:00			`eval_sets[i] = Pool(`
			`data=data_dictionary["test_features"],`
			`label=data_dictionary["test_labels"].iloc[:, i],`
			`weight=data_dictionary["test_weights"],`
			`)`

			`init_model = self.get_init_model(dk.pair)`

			`if init_model:`
			`init_models = init_model.estimators_`
			`else:`
			`init_models = [None] * y.shape[1]`

			`fit_params = []`
			`for i in range(len(eval_sets)):`
ruff format: freqai 2024-05-12 15:12:20 +00:00			`fit_params.append(`
			`{`
			`"eval_set": eval_sets[i],`
			`"init_model": init_models[i],`
			`}`
			`)`
enable continual learning and evaluation sets on multioutput models. 2022-09-10 14:54:13 +00:00
			`model = FreqaiMultiOutputRegressor(estimator=cbr)`
ruff format: freqai 2024-05-12 15:12:20 +00:00			`thread_training = self.freqai_info.get("multitarget_parallel_training", False)`
allow user to multithread jobs (advanced users only) 2022-09-10 20:16:49 +00:00			`if thread_training:`
			`model.n_jobs = y.shape[1]`
enable continual learning and evaluation sets on multioutput models. 2022-09-10 14:54:13 +00:00			`model.fit(X=X, y=y, sample_weight=sample_weight, fit_params=fit_params)`

Rehaul organization of return values 2022-07-02 16:09:38 +00:00			`return model`