larger model(上一版本是3.0完整版)
This commit is contained in:
@@ -7,8 +7,8 @@
|
|||||||
"out_dir": "./results",
|
"out_dir": "./results",
|
||||||
"device": "auto",
|
"device": "auto",
|
||||||
"timesteps": 600,
|
"timesteps": 600,
|
||||||
"batch_size": 16,
|
"batch_size": 32,
|
||||||
"seq_len": 96,
|
"seq_len": 128,
|
||||||
"epochs": 10,
|
"epochs": 10,
|
||||||
"max_batches": 4000,
|
"max_batches": 4000,
|
||||||
"lambda": 0.7,
|
"lambda": 0.7,
|
||||||
@@ -26,16 +26,16 @@
|
|||||||
"use_tanh_eps": false,
|
"use_tanh_eps": false,
|
||||||
"eps_scale": 1.0,
|
"eps_scale": 1.0,
|
||||||
"model_time_dim": 128,
|
"model_time_dim": 128,
|
||||||
"model_hidden_dim": 512,
|
"model_hidden_dim": 768,
|
||||||
"model_num_layers": 2,
|
"model_num_layers": 2,
|
||||||
"model_dropout": 0.1,
|
"model_dropout": 0.1,
|
||||||
"model_ff_mult": 2,
|
"model_ff_mult": 2,
|
||||||
"model_pos_dim": 64,
|
"model_pos_dim": 64,
|
||||||
"model_use_pos_embed": true,
|
"model_use_pos_embed": true,
|
||||||
"backbone_type": "transformer",
|
"backbone_type": "transformer",
|
||||||
"transformer_num_layers": 2,
|
"transformer_num_layers": 4,
|
||||||
"transformer_nhead": 4,
|
"transformer_nhead": 4,
|
||||||
"transformer_ff_dim": 512,
|
"transformer_ff_dim": 1024,
|
||||||
"transformer_dropout": 0.1,
|
"transformer_dropout": 0.1,
|
||||||
"disc_mask_scale": 0.9,
|
"disc_mask_scale": 0.9,
|
||||||
"cont_loss_weighting": "inv_std",
|
"cont_loss_weighting": "inv_std",
|
||||||
@@ -57,16 +57,16 @@
|
|||||||
"type6_features": ["P4_HT_PO","P2_24Vdc","P2_HILout"],
|
"type6_features": ["P4_HT_PO","P2_24Vdc","P2_HILout"],
|
||||||
"shuffle_buffer": 256,
|
"shuffle_buffer": 256,
|
||||||
"use_temporal_stage1": true,
|
"use_temporal_stage1": true,
|
||||||
"temporal_hidden_dim": 256,
|
"temporal_hidden_dim": 384,
|
||||||
"temporal_num_layers": 1,
|
"temporal_num_layers": 1,
|
||||||
"temporal_dropout": 0.0,
|
"temporal_dropout": 0.0,
|
||||||
"temporal_epochs": 2,
|
"temporal_epochs": 3,
|
||||||
"temporal_lr": 0.001,
|
"temporal_lr": 0.001,
|
||||||
"quantile_loss_weight": 0.2,
|
"quantile_loss_weight": 0.2,
|
||||||
"quantile_points": [0.05, 0.25, 0.5, 0.75, 0.95],
|
"quantile_points": [0.05, 0.25, 0.5, 0.75, 0.95],
|
||||||
"snr_weighted_loss": true,
|
"snr_weighted_loss": true,
|
||||||
"snr_gamma": 1.0,
|
"snr_gamma": 1.0,
|
||||||
"residual_stat_weight": 0.05,
|
"residual_stat_weight": 0.05,
|
||||||
"sample_batch_size": 4,
|
"sample_batch_size": 8,
|
||||||
"sample_seq_len": 128
|
"sample_seq_len": 128
|
||||||
}
|
}
|
||||||
|
|||||||
Reference in New Issue
Block a user