Piment Noir Git Repositories - freqai-strategies.git/commitdiff
refactor(reforcexy): improve logging messages
author    Jérôme Benoit <jerome.benoit@sap.com>
          Sun, 23 Feb 2025 21:28:03 +0000 (22:28 +0100)
committer Jérôme Benoit <jerome.benoit@sap.com>
          Sun, 23 Feb 2025 21:28:03 +0000 (22:28 +0100)
Signed-off-by: Jérôme Benoit <jerome.benoit@sap.com>
ReforceXY/user_data/freqaimodels/ReforceXY.py

index ac0a5153bb97d0c1af9753a11d3f4683fdec3e4e..d7459ebca171b65ae12eccc5bee927bd176c34f2 100644 (file)
@@ -315,7 +315,7 @@ class ReforceXY(BaseReinforcementLearningModel):
         train_df = data_dictionary["train_features"]
         train_timesteps = len(train_df)
         test_timesteps = len(data_dictionary["test_features"])
-        train_cycles = int(self.rl_config.get("train_cycles", 25))
+        train_cycles = int(self.rl_config.get("train_cycles", 250))
         total_timesteps = train_timesteps * train_cycles
         train_days = steps_to_days(train_timesteps, self.config["timeframe"])
         total_days = steps_to_days(total_timesteps, self.config["timeframe"])
@@ -374,8 +374,9 @@ class ReforceXY(BaseReinforcementLearningModel):
         self.dd.update_metric_tracker("fit_time", time_spent, dk.pair)
 
         model_filename = dk.model_filename if dk.model_filename else "best"
-        if Path(dk.data_path / f"{model_filename}_model.zip").is_file():
-            logger.info("Callback found a best model.")
+        model_path = Path(dk.data_path / f"{model_filename}_model.zip")
+        if model_path.is_file():
+            logger.info(f"Callback found a best model: {model_path}.")
             best_model = self.MODELCLASS.load(dk.data_path / f"{model_filename}_model")
             return best_model
 
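Note on the hunk above: the checkpoint zip path is now built once and reused, so the existence check and the log line are guaranteed to refer to the same file. A minimal standalone sketch of that pattern follows, with hypothetical values standing in for dk.data_path and dk.model_filename; the fallback taken when no checkpoint exists is not part of this hunk.

from pathlib import Path

# Hypothetical values standing in for dk.data_path and dk.model_filename.
data_path = Path("user_data/models/ReforceXY/sub-train-BTC_1")
model_filename = "best"

model_path = Path(data_path / f"{model_filename}_model.zip")
if model_path.is_file():
    # The logged message now carries the exact path that was checked.
    print(f"Callback found a best model: {model_path}.")
else:
    # Illustrative only; ReforceXY's actual fallback behaviour is outside this hunk.
    print(f"No checkpoint at {model_path}; a fallback model would be used here.")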
@@ -792,12 +793,7 @@ class ReforceXY(BaseReinforcementLearningModel):
 
             # reward agent for entering trades
             if (
-                action == Actions.Long_enter.value
-                and self._position == Positions.Neutral
-            ):
-                return 25.0
-            if (
-                action == Actions.Short_enter.value
+                action in (Actions.Long_enter.value, Actions.Short_enter.value)
                 and self._position == Positions.Neutral
             ):
                 return 25.0
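Note on the hunk above: the two removed entry branches returned the same 25.0 reward, so they collapse into a single membership test over both entry actions. Below is a small self-contained sketch of the equivalence, using stand-in enums that mirror the names in the diff; the real Actions and Positions presumably come from freqtrade's RL base environment and may define additional members.

from enum import Enum

class Actions(Enum):  # stand-in mirroring the names used in the diff
    Neutral = 0
    Long_enter = 1
    Long_exit = 2
    Short_enter = 3
    Short_exit = 4

class Positions(Enum):  # stand-in mirroring the names used in the diff
    Short = 0
    Long = 1
    Neutral = 0.5

def entry_reward(action: int, position: Positions) -> float:
    # Single condition covering both entry actions from a neutral position.
    if (
        action in (Actions.Long_enter.value, Actions.Short_enter.value)
        and position == Positions.Neutral
    ):
        return 25.0
    return 0.0

# Behaviour matches the two branches that were removed.
assert entry_reward(Actions.Long_enter.value, Positions.Neutral) == 25.0
assert entry_reward(Actions.Short_enter.value, Positions.Neutral) == 25.0
assert entry_reward(Actions.Long_enter.value, Positions.Long) == 0.0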