larger model(上一版本是3.0完整版)

This commit is contained in:
2026-01-28 23:55:36 +08:00
parent 803336ab06
commit 24830ed164

View File

@@ -7,8 +7,8 @@
 "out_dir": "./results",
 "device": "auto",
 "timesteps": 600,
-"batch_size": 16,
-"seq_len": 96,
+"batch_size": 32,
+"seq_len": 128,
 "epochs": 10,
 "max_batches": 4000,
 "lambda": 0.7,
@@ -26,16 +26,16 @@
 "use_tanh_eps": false,
 "eps_scale": 1.0,
 "model_time_dim": 128,
-"model_hidden_dim": 512,
+"model_hidden_dim": 768,
 "model_num_layers": 2,
 "model_dropout": 0.1,
 "model_ff_mult": 2,
 "model_pos_dim": 64,
 "model_use_pos_embed": true,
 "backbone_type": "transformer",
-"transformer_num_layers": 2,
+"transformer_num_layers": 4,
 "transformer_nhead": 4,
-"transformer_ff_dim": 512,
+"transformer_ff_dim": 1024,
 "transformer_dropout": 0.1,
 "disc_mask_scale": 0.9,
 "cont_loss_weighting": "inv_std",
@@ -57,16 +57,16 @@
 "type6_features": ["P4_HT_PO","P2_24Vdc","P2_HILout"],
 "shuffle_buffer": 256,
 "use_temporal_stage1": true,
-"temporal_hidden_dim": 256,
+"temporal_hidden_dim": 384,
 "temporal_num_layers": 1,
 "temporal_dropout": 0.0,
-"temporal_epochs": 2,
+"temporal_epochs": 3,
 "temporal_lr": 0.001,
 "quantile_loss_weight": 0.2,
 "quantile_points": [0.05, 0.25, 0.5, 0.75, 0.95],
 "snr_weighted_loss": true,
 "snr_gamma": 1.0,
 "residual_stat_weight": 0.05,
-"sample_batch_size": 4,
+"sample_batch_size": 8,
 "sample_seq_len": 128
 }