From: Jérôme Benoit Date: Mon, 29 Dec 2025 15:27:29 +0000 (+0100) Subject: perf(ReforceXY): tune default hold potential ratio to 0.03125 X-Git-Url: https://git.piment-noir.org/?a=commitdiff_plain;h=fddb641a9f1e1a209d8e76e04dcd577e553f0d63;p=freqai-strategies.git perf(ReforceXY): tune default hold potential ratio to 0.03125 Signed-off-by: Jérôme Benoit --- diff --git a/ReforceXY/reward_space_analysis/README.md b/ReforceXY/reward_space_analysis/README.md index 65450f4..df8b2cf 100644 --- a/ReforceXY/reward_space_analysis/README.md +++ b/ReforceXY/reward_space_analysis/README.md @@ -334,7 +334,7 @@ across samples) and does not apply any drift correction in post-processing. | Parameter | Default | Description | | ----------------------------------- | -------- | -------------------- | -| `hold_potential_ratio` | 0.015625 | Hold potential ratio | +| `hold_potential_ratio` | 0.03125 | Hold potential ratio | | `hold_potential_gain` | 1.0 | Gain multiplier | | `hold_potential_transform_pnl` | tanh | PnL transform | | `hold_potential_transform_duration` | tanh | Duration transform | diff --git a/ReforceXY/reward_space_analysis/reward_space_analysis.py b/ReforceXY/reward_space_analysis/reward_space_analysis.py index a8ac936..e6daa92 100644 --- a/ReforceXY/reward_space_analysis/reward_space_analysis.py +++ b/ReforceXY/reward_space_analysis/reward_space_analysis.py @@ -164,7 +164,7 @@ DEFAULT_MODEL_REWARD_PARAMETERS: RewardParams = { "exit_potential_decay": 0.5, # Hold potential (PBRS function Φ) "hold_potential_enabled": True, - "hold_potential_ratio": 0.015625, + "hold_potential_ratio": 0.03125, "hold_potential_gain": 1.0, "hold_potential_transform_pnl": "tanh", "hold_potential_transform_duration": "tanh", diff --git a/ReforceXY/reward_space_analysis/tests/constants.py b/ReforceXY/reward_space_analysis/tests/constants.py index ba564e7..887aafe 100644 --- a/ReforceXY/reward_space_analysis/tests/constants.py +++ b/ReforceXY/reward_space_analysis/tests/constants.py @@ -285,7 +285,7 @@ class TestParameters: ADDITIVE_GAIN_DEFAULT: Default additive gain (1.0) # PBRS hold potential parameters - HOLD_POTENTIAL_RATIO_DEFAULT: Default hold potential ratio (0.015625) + HOLD_POTENTIAL_RATIO_DEFAULT: Default hold potential ratio (0.03125) """ BASE_FACTOR: float = 90.0 @@ -315,7 +315,7 @@ class TestParameters: ADDITIVE_GAIN_DEFAULT: float = 1.0 # PBRS hold potential parameters - HOLD_POTENTIAL_RATIO_DEFAULT: float = 0.015625 + HOLD_POTENTIAL_RATIO_DEFAULT: float = 0.03125 @dataclass(frozen=True) diff --git a/ReforceXY/user_data/freqaimodels/ReforceXY.py b/ReforceXY/user_data/freqaimodels/ReforceXY.py index be8e942..4bdba9e 100644 --- a/ReforceXY/user_data/freqaimodels/ReforceXY.py +++ b/ReforceXY/user_data/freqaimodels/ReforceXY.py @@ -161,7 +161,7 @@ class ReforceXY(BaseReinforcementLearningModel): DEFAULT_ENTRY_ADDITIVE_RATIO: Final[float] = 0.125 DEFAULT_ENTRY_ADDITIVE_GAIN: Final[float] = 1.0 DEFAULT_HOLD_POTENTIAL_ENABLED: Final[bool] = True - DEFAULT_HOLD_POTENTIAL_RATIO: Final[float] = 0.015625 + DEFAULT_HOLD_POTENTIAL_RATIO: Final[float] = 0.03125 DEFAULT_HOLD_POTENTIAL_GAIN: Final[float] = 1.0 DEFAULT_EXIT_ADDITIVE_ENABLED: Final[bool] = False DEFAULT_EXIT_ADDITIVE_RATIO: Final[float] = 0.125 diff --git a/ReforceXY/user_data/strategies/RLAgentStrategy.py b/ReforceXY/user_data/strategies/RLAgentStrategy.py index 29487ff..dadcce6 100644 --- a/ReforceXY/user_data/strategies/RLAgentStrategy.py +++ b/ReforceXY/user_data/strategies/RLAgentStrategy.py @@ -1,6 +1,6 @@ import datetime import logging -from functools import cached_property, reduce +from functools import reduce from typing import Any, Final, Literal, Optional # import talib.abstract as ta