Add soft bounds, per-feature scaling, and full pipeline runner

2026-01-28 00:35:00 +08:00
parent f0f89abf4f
commit c3fb07ef11
8 changed files with 183 additions and 5 deletions
--- a/docs/README.md
+++ b/docs/README.md
@@ -13,3 +13,4 @@ Conventions:
 Tools:
 - `example/diagnose_ks.py` for per-feature KS + CDF plots.
 - `example/run_all_full.py` for one-command full pipeline + diagnostics.
--- a/docs/decisions.md
+++ b/docs/decisions.md
@@ -55,3 +55,10 @@
 - **Files**:
  - `example/data_utils.py`
  - `example/export_samples.py`
 ## 2026-01-27 — Soft bounds + post-scale for boundary pile-up
 - **Decision**: Replace hard sigmoid bounds with soft tanh bounds and allow per-feature post-scaling.
 - **Why**: With hard sigmoid bounds, many continuous features piled up at their upper bound (KS = 1.0).
 - **Files**:
  - `example/export_samples.py`
  - `example/config.json`
--- a/example/config.json
+++ b/example/config.json
@@ -44,7 +44,21 @@
  "cont_clamp_x0": 5.0,
  "use_quantile_transform": true,
  "quantile_bins": 1001,
-  "cont_bound_mode": "sigmoid",
+  "cont_bound_mode": "soft_tanh",
  "cont_bound_strength": 2.0,
  "cont_post_scale": {
    "P1_B4002": 0.8,
    "P1_B400B": 0.8,
    "P1_FT02Z": 0.8,
    "P1_PCV01D": 0.8,
    "P1_PCV01Z": 0.8,
    "P1_PCV02Z": 0.8,
    "P2_24Vdc": 0.8,
    "P2_MSD": 0.8,
    "P3_LCP01D": 0.8,
    "P4_ST_PT01": 0.8,
    "P4_ST_TT01": 0.8
  },
  "shuffle_buffer": 256,
  "use_temporal_stage1": true,
  "temporal_hidden_dim": 256,
--- a/example/config_no_temporal.json
+++ b/example/config_no_temporal.json
@@ -44,7 +44,21 @@
  "cont_clamp_x0": 5.0,
  "use_quantile_transform": true,
  "quantile_bins": 1001,
-  "cont_bound_mode": "sigmoid",
+  "cont_bound_mode": "soft_tanh",
  "cont_bound_strength": 2.0,
  "cont_post_scale": {
    "P1_B4002": 0.8,
    "P1_B400B": 0.8,
    "P1_FT02Z": 0.8,
    "P1_PCV01D": 0.8,
    "P1_PCV01Z": 0.8,
    "P1_PCV02Z": 0.8,
    "P2_24Vdc": 0.8,
    "P2_MSD": 0.8,
    "P3_LCP01D": 0.8,
    "P4_ST_PT01": 0.8,
    "P4_ST_TT01": 0.8
  },
  "shuffle_buffer": 1024,
  "use_temporal_stage1": false,
  "sample_batch_size": 4,
--- a/example/config_temporal_strong.json
+++ b/example/config_temporal_strong.json
@@ -44,7 +44,21 @@
  "cont_clamp_x0": 5.0,
  "use_quantile_transform": true,
  "quantile_bins": 1001,
-  "cont_bound_mode": "sigmoid",
+  "cont_bound_mode": "soft_tanh",
  "cont_bound_strength": 2.0,
  "cont_post_scale": {
    "P1_B4002": 0.8,
    "P1_B400B": 0.8,
    "P1_FT02Z": 0.8,
    "P1_PCV01D": 0.8,
    "P1_PCV01Z": 0.8,
    "P1_PCV02Z": 0.8,
    "P2_24Vdc": 0.8,
    "P2_MSD": 0.8,
    "P3_LCP01D": 0.8,
    "P4_ST_PT01": 0.8,
    "P4_ST_TT01": 0.8
  },
  "shuffle_buffer": 1024,
  "use_temporal_stage1": true,
  "temporal_hidden_dim": 512,
--- a/example/export_samples.py
+++ b/example/export_samples.py
@@ -144,6 +144,8 @@ def main():
    cont_clamp_x0 = float(cfg.get("cont_clamp_x0", 0.0))
    use_quantile = bool(cfg.get("use_quantile_transform", False))
    cont_bound_mode = str(cfg.get("cont_bound_mode", "clamp"))
    cont_bound_strength = float(cfg.get("cont_bound_strength", 1.0))
    cont_post_scale = cfg.get("cont_post_scale", {}) if isinstance(cfg.get("cont_post_scale", {}), dict) else {}
    use_temporal_stage1 = bool(cfg.get("use_temporal_stage1", False))
    temporal_hidden_dim = int(cfg.get("temporal_hidden_dim", 256))
    temporal_num_layers = int(cfg.get("temporal_num_layers", 1))
@@ -287,10 +289,28 @@ def main():
            hi = vmax.get(c, None)
            if lo is None or hi is None:
                continue
            lo = float(lo)
            hi = float(hi)
            if cont_bound_mode == "sigmoid":
-                x_cont[:, :, i] = float(lo) + (float(hi) - float(lo)) * torch.sigmoid(x_cont[:, :, i])
+                x_cont[:, :, i] = lo + (hi - lo) * torch.sigmoid(x_cont[:, :, i])
            elif cont_bound_mode == "soft_tanh":
                # Soft bound without hard piling at edges
                mid = 0.5 * (lo + hi)
                half = 0.5 * (hi - lo)
                denom = cont_bound_strength if cont_bound_strength > 0 else 1.0
                x_cont[:, :, i] = mid + half * torch.tanh(x_cont[:, :, i] / denom)
            else:
-                x_cont[:, :, i] = torch.clamp(x_cont[:, :, i], float(lo), float(hi))
+                x_cont[:, :, i] = torch.clamp(x_cont[:, :, i], lo, hi)
    # optional post-scaling for problematic features
    if cont_post_scale:
        for i, c in enumerate(cont_cols):
            if c in cont_post_scale:
                try:
                    scale = float(cont_post_scale[c])
                except Exception:
                    scale = 1.0
                x_cont[:, :, i] = x_cont[:, :, i] * scale
    header = read_header(data_path)
    out_cols = [c for c in header if c != time_col or args.include_time]
--- a/example/run_all_full.py
+++ b/example/run_all_full.py
@@ -0,0 +1,107 @@
 #!/usr/bin/env python3
 """Run full pipeline + diagnostics in one command."""
 import argparse
 import json
 import subprocess
 import sys
 from pathlib import Path
 from platform_utils import safe_path, is_windows, resolve_path
 def run(cmd):
    """Echo a command, then execute it and fail fast on a non-zero exit.

    Args:
        cmd: Sequence of string arguments, program first. Every argument is
            passed through ``safe_path`` (imported from ``platform_utils``)
            before the child process is started.

    Raises:
        subprocess.CalledProcessError: If the child exits with a non-zero
            status (``check=True``).
    """
    # Echo the command exactly as the caller supplied it, before safe_path runs.
    print("running:", " ".join(cmd))
    cmd = [safe_path(arg) for arg in cmd]
    # The former Windows / non-Windows branches were identical: shell=False is
    # the default of subprocess.run, so one explicit call covers every platform.
    subprocess.run(cmd, check=True, shell=False)
 def parse_args():
    """Parse the command-line options of the full-pipeline runner.

    Returns:
        argparse.Namespace carrying ``config`` (defaults to ``config.json``
        next to this script), ``device`` (defaults to ``"auto"``) and one
        boolean ``skip_<stage>`` flag per pipeline stage.
    """
    script_dir = Path(__file__).resolve().parent
    default_config = str(script_dir / "config.json")

    cli = argparse.ArgumentParser(description="Run prepare -> train -> export -> eval -> diagnostics.")
    cli.add_argument("--config", default=default_config)
    cli.add_argument("--device", default="auto", help="cpu, cuda, or auto")
    # One opt-out switch per stage, registered in pipeline order.
    for stage in ("prepare", "train", "export", "eval", "diagnose"):
        cli.add_argument(f"--skip-{stage}", action="store_true")
    return cli.parse_args()
 def resolve_config(base_dir: Path, cfg_arg: str) -> Path:
    """Turn the ``--config`` argument into a path via ``resolve_path``.

    Lookup order:
      1. an absolute path is used as given;
      2. a relative path that exists under ``base_dir`` is taken from there;
      3. a relative path that exists as given (relative to the current
         working directory) is used as is;
      4. otherwise the path is resolved against ``base_dir`` without any
         existence check.

    Args:
        base_dir: Directory tried first for relative config paths.
        cfg_arg: Raw value of the ``--config`` option.

    Returns:
        ``Path`` wrapping whatever ``resolve_path`` returns for the chosen
        candidate.
    """
    requested = Path(cfg_arg)
    if not requested.is_absolute():
        beside_script = base_dir / requested
        if beside_script.exists():
            requested = beside_script
        elif not requested.exists():
            # Found nowhere: fall back to resolving against base_dir.
            return Path(resolve_path(base_dir, requested))
    # Absolute path or existing file: resolve against its own parent directory.
    return Path(resolve_path(requested.parent, requested))
 def main():
    """Run every pipeline stage that was not skipped on the command line.

    Stage order: ``prepare_data.py``, ``train.py``, ``export_samples.py``,
    ``evaluate_generated.py`` followed by ``summary_metrics.py``, and finally
    ``diagnose_ks.py``. Each script lives next to this file and is launched
    through ``run`` with the current interpreter.
    """
    args = parse_args()
    here = Path(__file__).resolve().parent
    config_path = resolve_config(here, args.config)
    with open(config_path, "r", encoding="utf-8") as handle:
        cfg = json.load(handle)

    def launch(script_name, *extra):
        # Start one pipeline script that sits beside this file.
        run([sys.executable, str(here / script_name), *extra])

    # Sampling options come from the config; the sample_* keys take
    # precedence over their training counterparts when both are present.
    export_opts = [
        "--include-time",
        "--device",
        args.device,
        "--config",
        str(config_path),
        "--timesteps",
        str(cfg.get("timesteps", 200)),
        "--seq-len",
        str(cfg.get("sample_seq_len", cfg.get("seq_len", 64))),
        "--batch-size",
        str(cfg.get("sample_batch_size", cfg.get("batch_size", 2))),
        "--clip-k",
        str(cfg.get("clip_k", 5.0)),
        "--use-ema",
    ]

    if not args.skip_prepare:
        launch("prepare_data.py")

    if not args.skip_train:
        launch("train.py", "--config", str(config_path), "--device", args.device)

    if not args.skip_export:
        launch("export_samples.py", *export_opts)

    if not args.skip_eval:
        # Pass --reference only when the config names a data source.
        ref = cfg.get("data_glob") or cfg.get("data_path") or ""
        reference_opts = ["--reference", str(ref)] if ref else []
        launch("evaluate_generated.py", *reference_opts)
        launch("summary_metrics.py")

    if not args.skip_diagnose:
        # NOTE(review): --reference receives the config file here, whereas the
        # eval stage passes the data glob/path; confirm diagnose_ks.py expects
        # a config path.
        launch(
            "diagnose_ks.py",
            "--generated",
            str(here / "results" / "generated.csv"),
            "--reference",
            str(config_path),
            "--top-k",
            "10",
        )
 # Script entry point: run the pipeline only when this file is executed directly.
 if __name__ == "__main__":
    main()
--- a/report.md
+++ b/report.md
@@ -194,6 +194,7 @@ Recent run (user-reported, Windows):
 ## 10. Automation / 自动化
 `example/run_all.py` runs all stages with config-driven paths.
 `example/run_all_full.py` runs prepare/train/export/eval + KS diagnostics in one command.
 `example/run_compare.py` can run a baseline vs temporal config and compute metric deltas.
 ---