2022-07-09 08:13:33 +00:00
|
|
|
import logging
|
2022-10-09 19:11:37 +00:00
|
|
|
from pathlib import Path
|
2022-08-13 18:07:31 +00:00
|
|
|
from typing import Any, Dict
|
|
|
|
|
2022-07-09 08:13:33 +00:00
|
|
|
from catboost import CatBoostClassifier, Pool
|
2022-09-07 16:58:55 +00:00
|
|
|
|
2022-09-10 14:54:13 +00:00
|
|
|
from freqtrade.freqai.base_models.BaseClassifierModel import BaseClassifierModel
|
2022-09-06 18:30:37 +00:00
|
|
|
from freqtrade.freqai.data_kitchen import FreqaiDataKitchen
|
2022-08-13 18:07:31 +00:00
|
|
|
|
2022-07-09 08:13:33 +00:00
|
|
|
|
|
|
|
# Module-level logger, named after this module via ``__name__``.
logger = logging.getLogger(__name__)
|
|
|
|
|
|
|
|
|
2022-08-13 18:07:31 +00:00
|
|
|
class CatboostClassifier(BaseClassifierModel):
    """
    Classifier model that trains a CatBoost ``CatBoostClassifier``.

    This class only provides ``fit()``; all other behaviour is inherited
    from ``BaseClassifierModel``.
    """

    def fit(self, data_dictionary: Dict, dk: FreqaiDataKitchen, **kwargs) -> Any:
        """
        Wrap the prepared data in CatBoost pools and train a multi-class classifier.

        :param data_dictionary: dictionary providing the "train_features",
                                "train_labels" and "train_weights" entries and,
                                unless the configured test_size is 0, the matching
                                "test_*" entries.
        :param dk: data kitchen for the current pair; its ``data_path`` is used as
                   the CatBoost ``train_dir`` and its ``pair`` is handed to
                   ``get_init_model``.
        :return: the fitted ``CatBoostClassifier`` instance.
        """
        fit_pool = Pool(
            data=data_dictionary["train_features"],
            label=data_dictionary["train_labels"],
            weight=data_dictionary["train_weights"],
        )

        # A configured test_size of 0 disables the evaluation set (eval_set=None).
        split_cfg = self.freqai_info.get("data_split_parameters", {})
        no_eval = split_cfg.get("test_size", 0.1) == 0
        eval_pool = None if no_eval else Pool(
            data=data_dictionary["test_features"],
            label=data_dictionary["test_labels"],
            weight=data_dictionary["test_weights"],
        )

        # User-supplied training parameters are expanded after the fixed keyword
        # arguments, exactly as in the constructor call they configure.
        classifier = CatBoostClassifier(
            allow_writing_files=True,
            loss_function="MultiClass",
            train_dir=Path(dk.data_path),
            **self.model_training_parameters,
        )

        # Whatever get_init_model returns for this pair is forwarded as init_model.
        classifier.fit(
            X=fit_pool,
            eval_set=eval_pool,
            init_model=self.get_init_model(dk.pair),
        )
        return classifier
|