From 24830ed164e94d761cce0d94538a55b91908ad67 Mon Sep 17 00:00:00 2001 From: MingzheYang Date: Wed, 28 Jan 2026 23:55:36 +0800 Subject: [PATCH] =?UTF-8?q?larger=20model(=E4=B8=8A=E4=B8=80=E7=89=88?= =?UTF-8?q?=E6=9C=AC=E6=98=AF3.0=E5=AE=8C=E6=95=B4=E7=89=88=EF=BC=89?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- example/config.json | 16 ++++++++-------- 1 file changed, 8 insertions(+), 8 deletions(-) diff --git a/example/config.json b/example/config.json index cc0912f..804dcfe 100644 --- a/example/config.json +++ b/example/config.json @@ -7,8 +7,8 @@ "out_dir": "./results", "device": "auto", "timesteps": 600, - "batch_size": 16, - "seq_len": 96, + "batch_size": 32, + "seq_len": 128, "epochs": 10, "max_batches": 4000, "lambda": 0.7, @@ -26,16 +26,16 @@ "use_tanh_eps": false, "eps_scale": 1.0, "model_time_dim": 128, - "model_hidden_dim": 512, + "model_hidden_dim": 768, "model_num_layers": 2, "model_dropout": 0.1, "model_ff_mult": 2, "model_pos_dim": 64, "model_use_pos_embed": true, "backbone_type": "transformer", - "transformer_num_layers": 2, + "transformer_num_layers": 4, "transformer_nhead": 4, - "transformer_ff_dim": 512, + "transformer_ff_dim": 1024, "transformer_dropout": 0.1, "disc_mask_scale": 0.9, "cont_loss_weighting": "inv_std", @@ -57,16 +57,16 @@ "type6_features": ["P4_HT_PO","P2_24Vdc","P2_HILout"], "shuffle_buffer": 256, "use_temporal_stage1": true, - "temporal_hidden_dim": 256, + "temporal_hidden_dim": 384, "temporal_num_layers": 1, "temporal_dropout": 0.0, - "temporal_epochs": 2, + "temporal_epochs": 3, "temporal_lr": 0.001, "quantile_loss_weight": 0.2, "quantile_points": [0.05, 0.25, 0.5, 0.75, 0.95], "snr_weighted_loss": true, "snr_gamma": 1.0, "residual_stat_weight": 0.05, - "sample_batch_size": 4, + "sample_batch_size": 8, "sample_seq_len": 128 }