]> Piment Noir Git Repositories - freqai-strategies.git/commitdiff
docs(reforcexy): refine README.md
authorJérôme Benoit <jerome.benoit@piment-noir.org>
Fri, 10 Oct 2025 10:27:16 +0000 (12:27 +0200)
committerJérôme Benoit <jerome.benoit@piment-noir.org>
Fri, 10 Oct 2025 10:27:16 +0000 (12:27 +0200)
Signed-off-by: Jérôme Benoit <jerome.benoit@piment-noir.org>
ReforceXY/reward_space_analysis/README.md
quickadapter/user_data/strategies/QuickAdapterV3.py

index d63d4a359c4ed2949535828553659992b0a53a24..79502c719bea23dffb573a8ac762d650281fc95e 100644 (file)
@@ -161,7 +161,7 @@ python reward_space_analysis.py \
 # Then compare:
 python reward_space_analysis.py \
     --num_samples 100000 \
-    --real_episodes ../user_data/transitions/*.pkl \
+    --real_episodes path/to/episode_rewards.pkl \
     --output real_vs_synthetic
 ```
 
@@ -315,7 +315,7 @@ _Invariant / safety controls:_
 
 - Path to real episode rewards pickle file for distribution comparison
 - Enables distribution shift analysis (KL(synthetic‖real), JS distance, Wasserstein distance, KS test)
-- Example: `../user_data/models/ReforceXY-PPO/sub_train_SYMBOL_DATE/episode_rewards.pkl`
+- Example: `path/to/episode_rewards.pkl`
 
 **`--pvalue_adjust`** (choice: none|benjamini_hochberg, default: none)
 
@@ -383,7 +383,7 @@ python reward_space_analysis.py \
 # Real vs synthetic comparison
 python reward_space_analysis.py \
     --num_samples 100000 \
-    --real_episodes ../user_data/models/path/to/episode_rewards.pkl \
+    --real_episodes path/to/episode_rewards.pkl \
     --output validation
 ```
 
@@ -479,7 +479,7 @@ For production validation, compare synthetic analysis with real trading episodes
 ```shell
 python reward_space_analysis.py \
     --num_samples 100000 \
-    --real_episodes ../user_data/transitions/episode_rewards.pkl \
+    --real_episodes path/to/episode_rewards.pkl \
     --output real_vs_synthetic
 ```
 
index 0973ac21cb39c895f2f8480937767ff9a9352b8d..2717763e95ac1fcf3b111fd511953028a33f56d2 100644 (file)
@@ -1243,7 +1243,7 @@ class QuickAdapterV3(IStrategy):
                     f"User denied {trade_direction} {order} for {pair}: "
                     f"close_k[{-k}] {format_number(close_k)} "
                     f"did not break threshold_k[{-(k + 1)}] {format_number(threshold_k)} "
-                    f"(decayed min/max natr_ratio_percent: min={format_number(decayed_min_natr_ratio_percent)}, max={format_number(decayed_max_natr_ratio_percent)})"
+                    f"(decayed natr_ratio_percent: min={format_number(decayed_min_natr_ratio_percent)}, max={format_number(decayed_max_natr_ratio_percent)})"
                 )
                 return False