fix(weights): tighten observability and edge-case handling in label pipeline

author Jérôme Benoit <jerome.benoit@piment-noir.org>

Mon, 25 May 2026 00:31:49 +0000 (02:31 +0200)

committer Jérôme Benoit <jerome.benoit@piment-noir.org>

Mon, 25 May 2026 00:31:49 +0000 (02:31 +0200)
author Jérôme Benoit <jerome.benoit@piment-noir.org>
Mon, 25 May 2026 00:31:49 +0000 (02:31 +0200)
committer Jérôme Benoit <jerome.benoit@piment-noir.org>
Mon, 25 May 2026 00:31:49 +0000 (02:31 +0200)
diff --git a/quickadapter/user_data/freqaimodels/QuickAdapterRegressorV3.py b/quickadapter/user_data/freqaimodels/QuickAdapterRegressorV3.py

index 6e50be14a2f2389e858bfe277f93427b5cb2d868..c1a74a907aa5a408c8c69990c3716b921363574f 100644 (file)
--- a/quickadapter/user_data/freqaimodels/QuickAdapterRegressorV3.py
+++ b/quickadapter/user_data/freqaimodels/QuickAdapterRegressorV3.py
@@ -1118,6 +1118,12 @@ class QuickAdapterRegressorV3(BaseRegressionModel):
              logger.info(
                  f"    keep_fraction: {format_number(col_prediction['keep_fraction'])}"
              )
+            if col_prediction["method"] == PREDICTION_METHODS[0]:  # "none"
+                logger.warning(
+                    f"  Prediction method is 'none' for label [{label_col}]: "
+                    f"minima_threshold/maxima_threshold will not be computed and "
+                    f"entry signals based on them will never trigger."
+                )
  
          default_label_period_candles, default_label_natr_multiplier = (
              self._label_defaults
@@ -1483,9 +1489,13 @@ class QuickAdapterRegressorV3(BaseRegressionModel):
                      )
                  )
  
-        train_weights = sanitize_and_renormalize(train_weights)
+        train_weights = sanitize_and_renormalize(
+            train_weights, logger=logger, context="train_test_split:train"
+        )
          if test_size != 0:
-            test_weights = sanitize_and_renormalize(test_weights)
+            test_weights = sanitize_and_renormalize(
+                test_weights, logger=logger, context="train_test_split:test"
+            )
  
          if feat_dict.get("reverse_train_test_order", False):
              return dk.build_data_dictionary(
@@ -1644,7 +1654,11 @@ class QuickAdapterRegressorV3(BaseRegressionModel):
                  dd["train_features"], dd["train_labels"], dd["train_weights"]
              )
          )
-        dd["train_weights"] = sanitize_and_renormalize(dd["train_weights"])
+        dd["train_weights"] = sanitize_and_renormalize(
+            dd["train_weights"],
+            logger=logger,
+            context="post_feature_pipeline:train",
+        )
          dd["train_labels"], _, _ = dk.label_pipeline.fit_transform(dd["train_labels"])
  
          if (
@@ -1693,7 +1707,11 @@ class QuickAdapterRegressorV3(BaseRegressionModel):
                          dd["test_features"], dd["test_labels"], dd["test_weights"]
                      )
                  )
-                dd["test_weights"] = sanitize_and_renormalize(dd["test_weights"])
+                dd["test_weights"] = sanitize_and_renormalize(
+                    dd["test_weights"],
+                    logger=logger,
+                    context="post_feature_pipeline:test",
+                )
                  dd["test_labels"], _, _ = dk.label_pipeline.transform(dd["test_labels"])
  
          return dd
@@ -1803,8 +1821,12 @@ class QuickAdapterRegressorV3(BaseRegressionModel):
          test_features = filtered_dataframe.iloc[test_idx]
          train_labels = labels.iloc[train_idx]
          test_labels = labels.iloc[test_idx]
-        train_weights = sanitize_and_renormalize(weights[train_idx])
-        test_weights = sanitize_and_renormalize(weights[test_idx])
+        train_weights = sanitize_and_renormalize(
+            weights[train_idx], logger=logger, context="timeseries_split:train"
+        )
+        test_weights = sanitize_and_renormalize(
+            weights[test_idx], logger=logger, context="timeseries_split:test"
+        )
  
          if feat_dict.get("reverse_train_test_order", False):
              return dk.build_data_dictionary(
diff --git a/quickadapter/user_data/strategies/QuickAdapterV3.py b/quickadapter/user_data/strategies/QuickAdapterV3.py

index e839555ad1c702696a1fe9426447b6b5002ad56a..223221e83cda964461a886f1359600f796b9fcc2 100644 (file)
--- a/quickadapter/user_data/strategies/QuickAdapterV3.py
+++ b/quickadapter/user_data/strategies/QuickAdapterV3.py
@@ -860,7 +860,8 @@ class QuickAdapterV3(IStrategy):
                  dataframe[label_weight_col], **col_smoothing_config
              )
              dataframe[label_weight_col] = smoothed_label_weights.where(
-                smoothed_label_weights.gt(0) & smoothed_label_weights.notna(), 0.0
+                np.isfinite(smoothed_label_weights) & smoothed_label_weights.gt(0),
+                0.0,
              )
  
              if label_col == EXTREMA_COLUMN:
diff --git a/quickadapter/user_data/strategies/Utils.py b/quickadapter/user_data/strategies/Utils.py

index b168eb31c94316f459461e8b9b665e40da59116c..2c93905c4be5cd4254357b924d90002cd26f205f 100644 (file)
--- a/quickadapter/user_data/strategies/Utils.py
+++ b/quickadapter/user_data/strategies/Utils.py
@@ -717,6 +717,9 @@ def midpoint(value1: T, value2: T) -> T:
  def sanitize_and_renormalize(
      arr: NDArray[np.floating],
      drop_mask: NDArray[np.bool_] | None = None,
+    *,
+    logger: Logger | None = None,
+    context: str | None = None,
  ) -> NDArray[np.floating]:
      arr = np.asarray(arr, dtype=float)
      if arr.size == 0:
@@ -728,6 +731,14 @@ def sanitize_and_renormalize(
      total = safe.sum()
      if total > 0 and np.isfinite(total):
          return safe * (len(safe) / total)
+    if logger is not None:
+        logger.warning(
+            "sanitize_and_renormalize: weights collapsed (context=%s, total=%r, "
+            "n=%d); falling back to uniform weights",
+            context or "unspecified",
+            total,
+            len(arr),
+        )
      fallback = np.ones_like(arr)
      if drop_mask is not None:
          fallback[drop_mask] = 0.0
@@ -974,21 +985,27 @@ def _impute_weights(
      if weights.size == 0:
          return np.full_like(weights, default_weight, dtype=float)
  
-    # Weights computed by `zigzag` can be NaN on boundary pivots
+    # Zigzag emits NaN at unconfirmed boundary pivots; zero them out and
+    # exclude them from the median so they don't skew interior imputation.
+    boundary_mask = np.zeros(weights.size, dtype=bool)
      if not np.isfinite(weights[0]):
-        weights[0] = 0.0
+        boundary_mask[0] = True
      if not np.isfinite(weights[-1]):
-        weights[-1] = 0.0
+        boundary_mask[-1] = True
  
      finite_mask = np.isfinite(weights)
-    if not finite_mask.any():
-        return np.full_like(weights, default_weight, dtype=float)
+    interior_finite_mask = finite_mask & ~boundary_mask
+    if not interior_finite_mask.any():
+        weights[~finite_mask] = default_weight
+        weights[boundary_mask] = 0.0
+        return weights
  
-    median_weight = np.nanmedian(weights[finite_mask])
+    median_weight = np.nanmedian(weights[interior_finite_mask])
      if not np.isfinite(median_weight):
          median_weight = default_weight
  
      weights[~finite_mask] = median_weight
+    weights[boundary_mask] = 0.0
  
      return weights
author	Jérôme Benoit <jerome.benoit@piment-noir.org>
	Mon, 25 May 2026 00:31:49 +0000 (02:31 +0200)
committer	Jérôme Benoit <jerome.benoit@piment-noir.org>
	Mon, 25 May 2026 00:31:49 +0000 (02:31 +0200)
quickadapter/user_data/freqaimodels/QuickAdapterRegressorV3.py		patch \| blob \| blame \| history
quickadapter/user_data/strategies/QuickAdapterV3.py		patch \| blob \| blame \| history
quickadapter/user_data/strategies/Utils.py		patch \| blob \| blame \| history