Closed: Kazeya27 closed this issue 1 month ago
PEMSD8 { "embed_dim": 64, "skip_dim": 256, "geo_num_heads": 4, "sem_num_heads": 2, "t_num_heads": 2, "mlp_ratio": 4, "qkv_bias": true, "drop": 0, "attn_drop": 0, "drop_path": 0.3, "s_attn_size": 3, "t_attn_size": 1, "enc_depth": 6, "type_ln": "pre", "type_short_path": "hop", "scaler": "standard", "load_external": true, "normal_external": false, "ext_scaler": "none", "add_time_in_day": true, "add_day_in_week": true, "batch_size": 16, "seed": 1, "max_epoch": 200, "learner": "adamw", "learning_rate": 1e-3, "weight_decay": 0.05, "lr_decay": true, "lr_scheduler": "cosinelr", "lr_eta_min": 1e-4, "lr_decay_ratio": 0.1, "lr_warmup_epoch": 5, "lr_warmup_init": 1e-6, "clip_grad_norm": true, "max_grad_norm": 5, "use_early_stop": true, "patience": 50, "step_size": 2776, "task_level": 0, "use_curriculum_learning": true, "random_flip": true, "huber_delta": 2, "quan_delta": 0.25, "bidir": true, "far_mask_delta": 7, "dtw_delta": 5, "set_loss": "huber", "cluster_method": "kshape", "cand_key_days": 21 }
{ "embed_dim": 64, "skip_dim": 256, "geo_num_heads": 4, "sem_num_heads": 2, "t_num_heads": 2, "mlp_ratio": 4, "qkv_bias": true, "drop": 0, "attn_drop": 0, "drop_path": 0.3, "s_attn_size": 3, "t_attn_size": 1, "enc_depth": 6, "type_ln": "pre", "type_short_path": "hop", "scaler": "standard", "load_external": true, "normal_external": false, "ext_scaler": "none", "add_time_in_day": true, "add_day_in_week": true, "batch_size": 16, "seed": 1, "max_epoch": 200, "learner": "adamw", "learning_rate": 1e-3, "weight_decay": 0.05, "lr_decay": true, "lr_scheduler": "cosinelr", "lr_eta_min": 1e-4, "lr_decay_ratio": 0.1, "lr_warmup_epoch": 5, "lr_warmup_init": 1e-6, "clip_grad_norm": true, "max_grad_norm": 5, "use_early_stop": true, "patience": 50, "step_size": 2776, "task_level": 0, "use_curriculum_learning": true, "random_flip": true, "huber_delta": 2, "quan_delta": 0.25, "bidir": true, "far_mask_delta": 7, "dtw_delta": 5, "set_loss": "huber", "cluster_method": "kshape", "cand_key_days": 21 }
PEMSD4 { "embed_dim": 64, "skip_dim": 256, "geo_num_heads": 4, "sem_num_heads": 2, "t_num_heads": 2, "mlp_ratio": 4, "qkv_bias": true, "drop": 0, "attn_drop": 0, "drop_path": 0.3, "s_attn_size": 3, "t_attn_size": 1, "enc_depth": 6, "type_ln": "pre", "type_short_path": "hop", "scaler": "standard", "load_external": true, "normal_external": false, "ext_scaler": "none", "add_time_in_day": true, "add_day_in_week": true, "batch_size": 16, "seed": 0, "max_epoch": 200, "learner": "adamw", "learning_rate": 1e-3, "weight_decay": 0.05, "lr_decay": true, "lr_scheduler": "cosinelr", "lr_eta_min": 1e-4, "lr_decay_ratio": 0.1, "lr_warmup_epoch": 5, "lr_warmup_init": 1e-6, "clip_grad_norm": true, "max_grad_norm": 5, "use_early_stop": true, "patience": 50, "step_size": 1274, "task_level": 0, "use_curriculum_learning": true, "random_flip": true, "huber_delta": 2, "quan_delta": 0.25, "bidir": true, "far_mask_delta": 7, "dtw_delta": 5, "set_loss": "huber", "cluster_method": "kshape", "cand_key_days": 14 }
{ "embed_dim": 64, "skip_dim": 256, "geo_num_heads": 4, "sem_num_heads": 2, "t_num_heads": 2, "mlp_ratio": 4, "qkv_bias": true, "drop": 0, "attn_drop": 0, "drop_path": 0.3, "s_attn_size": 3, "t_attn_size": 1, "enc_depth": 6, "type_ln": "pre", "type_short_path": "hop", "scaler": "standard", "load_external": true, "normal_external": false, "ext_scaler": "none", "add_time_in_day": true, "add_day_in_week": true, "batch_size": 16, "seed": 0, "max_epoch": 200, "learner": "adamw", "learning_rate": 1e-3, "weight_decay": 0.05, "lr_decay": true, "lr_scheduler": "cosinelr", "lr_eta_min": 1e-4, "lr_decay_ratio": 0.1, "lr_warmup_epoch": 5, "lr_warmup_init": 1e-6, "clip_grad_norm": true, "max_grad_norm": 5, "use_early_stop": true, "patience": 50, "step_size": 1274, "task_level": 0, "use_curriculum_learning": true, "random_flip": true, "huber_delta": 2, "quan_delta": 0.25, "bidir": true, "far_mask_delta": 7, "dtw_delta": 5, "set_loss": "huber", "cluster_method": "kshape", "cand_key_days": 14 }
配置文件
PEMSD8
{ "embed_dim": 64, "skip_dim": 256, "geo_num_heads": 4, "sem_num_heads": 2, "t_num_heads": 2, "mlp_ratio": 4, "qkv_bias": true, "drop": 0, "attn_drop": 0, "drop_path": 0.3, "s_attn_size": 3, "t_attn_size": 1, "enc_depth": 6, "type_ln": "pre", "type_short_path": "hop", "scaler": "standard", "load_external": true, "normal_external": false, "ext_scaler": "none", "add_time_in_day": true, "add_day_in_week": true, "batch_size": 16, "seed": 1, "max_epoch": 200, "learner": "adamw", "learning_rate": 1e-3, "weight_decay": 0.05, "lr_decay": true, "lr_scheduler": "cosinelr", "lr_eta_min": 1e-4, "lr_decay_ratio": 0.1, "lr_warmup_epoch": 5, "lr_warmup_init": 1e-6, "clip_grad_norm": true, "max_grad_norm": 5, "use_early_stop": true, "patience": 50, "step_size": 2776, "task_level": 0, "use_curriculum_learning": true, "random_flip": true, "huber_delta": 2, "quan_delta": 0.25, "bidir": true, "far_mask_delta": 7, "dtw_delta": 5, "set_loss": "huber", "cluster_method": "kshape", "cand_key_days": 21 }
PEMSD4
{ "embed_dim": 64, "skip_dim": 256, "geo_num_heads": 4, "sem_num_heads": 2, "t_num_heads": 2, "mlp_ratio": 4, "qkv_bias": true, "drop": 0, "attn_drop": 0, "drop_path": 0.3, "s_attn_size": 3, "t_attn_size": 1, "enc_depth": 6, "type_ln": "pre", "type_short_path": "hop", "scaler": "standard", "load_external": true, "normal_external": false, "ext_scaler": "none", "add_time_in_day": true, "add_day_in_week": true, "batch_size": 16, "seed": 0, "max_epoch": 200, "learner": "adamw", "learning_rate": 1e-3, "weight_decay": 0.05, "lr_decay": true, "lr_scheduler": "cosinelr", "lr_eta_min": 1e-4, "lr_decay_ratio": 0.1, "lr_warmup_epoch": 5, "lr_warmup_init": 1e-6, "clip_grad_norm": true, "max_grad_norm": 5, "use_early_stop": true, "patience": 50, "step_size": 1274, "task_level": 0, "use_curriculum_learning": true, "random_flip": true, "huber_delta": 2, "quan_delta": 0.25, "bidir": true, "far_mask_delta": 7, "dtw_delta": 5, "set_loss": "huber", "cluster_method": "kshape", "cand_key_days": 14 }
实验结果