From: Jérôme Benoit <jerome.benoit@piment-noir.org>
Date: Mon, 29 Dec 2025 15:27:29 +0000 (+0100)
Subject: perf(ReforceXY): tune default hold potential ratio to 0.03125
X-Git-Url: https://git.piment-noir.org/?a=commitdiff_plain;h=fddb641a9f1e1a209d8e76e04dcd577e553f0d63;p=freqai-strategies.git

perf(ReforceXY): tune default hold potential ratio to 0.03125

Signed-off-by: Jérôme Benoit <jerome.benoit@piment-noir.org>
---

diff --git a/ReforceXY/reward_space_analysis/README.md b/ReforceXY/reward_space_analysis/README.md
index 65450f4..df8b2cf 100644
--- a/ReforceXY/reward_space_analysis/README.md
+++ b/ReforceXY/reward_space_analysis/README.md
@@ -334,7 +334,7 @@ across samples) and does not apply any drift correction in post-processing.
 
 | Parameter                           | Default  | Description          |
 | ----------------------------------- | -------- | -------------------- |
-| `hold_potential_ratio`              | 0.015625 | Hold potential ratio |
+| `hold_potential_ratio`              | 0.03125  | Hold potential ratio |
 | `hold_potential_gain`               | 1.0      | Gain multiplier      |
 | `hold_potential_transform_pnl`      | tanh     | PnL transform        |
 | `hold_potential_transform_duration` | tanh     | Duration transform   |
diff --git a/ReforceXY/reward_space_analysis/reward_space_analysis.py b/ReforceXY/reward_space_analysis/reward_space_analysis.py
index a8ac936..e6daa92 100644
--- a/ReforceXY/reward_space_analysis/reward_space_analysis.py
+++ b/ReforceXY/reward_space_analysis/reward_space_analysis.py
@@ -164,7 +164,7 @@ DEFAULT_MODEL_REWARD_PARAMETERS: RewardParams = {
     "exit_potential_decay": 0.5,
     # Hold potential (PBRS function Φ)
     "hold_potential_enabled": True,
-    "hold_potential_ratio": 0.015625,
+    "hold_potential_ratio": 0.03125,
     "hold_potential_gain": 1.0,
     "hold_potential_transform_pnl": "tanh",
     "hold_potential_transform_duration": "tanh",
diff --git a/ReforceXY/reward_space_analysis/tests/constants.py b/ReforceXY/reward_space_analysis/tests/constants.py
index ba564e7..887aafe 100644
--- a/ReforceXY/reward_space_analysis/tests/constants.py
+++ b/ReforceXY/reward_space_analysis/tests/constants.py
@@ -285,7 +285,7 @@ class TestParameters:
         ADDITIVE_GAIN_DEFAULT: Default additive gain (1.0)
 
         # PBRS hold potential parameters
-        HOLD_POTENTIAL_RATIO_DEFAULT: Default hold potential ratio (0.015625)
+        HOLD_POTENTIAL_RATIO_DEFAULT: Default hold potential ratio (0.03125)
     """
 
     BASE_FACTOR: float = 90.0
@@ -315,7 +315,7 @@ class TestParameters:
     ADDITIVE_GAIN_DEFAULT: float = 1.0
 
     # PBRS hold potential parameters
-    HOLD_POTENTIAL_RATIO_DEFAULT: float = 0.015625
+    HOLD_POTENTIAL_RATIO_DEFAULT: float = 0.03125
 
 
 @dataclass(frozen=True)
diff --git a/ReforceXY/user_data/freqaimodels/ReforceXY.py b/ReforceXY/user_data/freqaimodels/ReforceXY.py
index be8e942..4bdba9e 100644
--- a/ReforceXY/user_data/freqaimodels/ReforceXY.py
+++ b/ReforceXY/user_data/freqaimodels/ReforceXY.py
@@ -161,7 +161,7 @@ class ReforceXY(BaseReinforcementLearningModel):
     DEFAULT_ENTRY_ADDITIVE_RATIO: Final[float] = 0.125
     DEFAULT_ENTRY_ADDITIVE_GAIN: Final[float] = 1.0
     DEFAULT_HOLD_POTENTIAL_ENABLED: Final[bool] = True
-    DEFAULT_HOLD_POTENTIAL_RATIO: Final[float] = 0.015625
+    DEFAULT_HOLD_POTENTIAL_RATIO: Final[float] = 0.03125
     DEFAULT_HOLD_POTENTIAL_GAIN: Final[float] = 1.0
     DEFAULT_EXIT_ADDITIVE_ENABLED: Final[bool] = False
     DEFAULT_EXIT_ADDITIVE_RATIO: Final[float] = 0.125
diff --git a/ReforceXY/user_data/strategies/RLAgentStrategy.py b/ReforceXY/user_data/strategies/RLAgentStrategy.py
index 29487ff..dadcce6 100644
--- a/ReforceXY/user_data/strategies/RLAgentStrategy.py
+++ b/ReforceXY/user_data/strategies/RLAgentStrategy.py
@@ -1,6 +1,6 @@
 import datetime
 import logging
-from functools import cached_property, reduce
+from functools import reduce
 from typing import Any, Final, Literal, Optional
 
 # import talib.abstract as ta