larger model(上一版本是3.0完整版)

This commit is contained in:
2026-01-28 23:55:36 +08:00
parent 803336ab06
commit 24830ed164

View File

@@ -7,8 +7,8 @@
"out_dir": "./results", "out_dir": "./results",
"device": "auto", "device": "auto",
"timesteps": 600, "timesteps": 600,
"batch_size": 16, "batch_size": 32,
"seq_len": 96, "seq_len": 128,
"epochs": 10, "epochs": 10,
"max_batches": 4000, "max_batches": 4000,
"lambda": 0.7, "lambda": 0.7,
@@ -26,16 +26,16 @@
"use_tanh_eps": false, "use_tanh_eps": false,
"eps_scale": 1.0, "eps_scale": 1.0,
"model_time_dim": 128, "model_time_dim": 128,
"model_hidden_dim": 512, "model_hidden_dim": 768,
"model_num_layers": 2, "model_num_layers": 2,
"model_dropout": 0.1, "model_dropout": 0.1,
"model_ff_mult": 2, "model_ff_mult": 2,
"model_pos_dim": 64, "model_pos_dim": 64,
"model_use_pos_embed": true, "model_use_pos_embed": true,
"backbone_type": "transformer", "backbone_type": "transformer",
"transformer_num_layers": 2, "transformer_num_layers": 4,
"transformer_nhead": 4, "transformer_nhead": 4,
"transformer_ff_dim": 512, "transformer_ff_dim": 1024,
"transformer_dropout": 0.1, "transformer_dropout": 0.1,
"disc_mask_scale": 0.9, "disc_mask_scale": 0.9,
"cont_loss_weighting": "inv_std", "cont_loss_weighting": "inv_std",
@@ -57,16 +57,16 @@
"type6_features": ["P4_HT_PO","P2_24Vdc","P2_HILout"], "type6_features": ["P4_HT_PO","P2_24Vdc","P2_HILout"],
"shuffle_buffer": 256, "shuffle_buffer": 256,
"use_temporal_stage1": true, "use_temporal_stage1": true,
"temporal_hidden_dim": 256, "temporal_hidden_dim": 384,
"temporal_num_layers": 1, "temporal_num_layers": 1,
"temporal_dropout": 0.0, "temporal_dropout": 0.0,
"temporal_epochs": 2, "temporal_epochs": 3,
"temporal_lr": 0.001, "temporal_lr": 0.001,
"quantile_loss_weight": 0.2, "quantile_loss_weight": 0.2,
"quantile_points": [0.05, 0.25, 0.5, 0.75, 0.95], "quantile_points": [0.05, 0.25, 0.5, 0.75, 0.95],
"snr_weighted_loss": true, "snr_weighted_loss": true,
"snr_gamma": 1.0, "snr_gamma": 1.0,
"residual_stat_weight": 0.05, "residual_stat_weight": 0.05,
"sample_batch_size": 4, "sample_batch_size": 8,
"sample_seq_len": 128 "sample_seq_len": 128
} }