---
# Experiment configuration: model DSANET on dataset PEMSD7.
# Four top-level sections: basic (run identity), data (dataset handling),
# model (network hyper-parameters) and train (optimisation settings).

basic:
  dataset: PEMSD7
  # Quoted so the embedded colon can never be misread by a YAML loader.
  device: 'cuda:0'
  mode: train
  model: DSANET
  seed: 2023

data:
  # NOTE(review): batch_size is repeated in data, model and train (all 16);
  # presumably they must stay equal -- confirm against the loader code.
  batch_size: 16
  column_wise: false
  days_per_week: 7
  horizon: 12
  input_dim: 1
  lag: 12
  normalizer: std
  # NOTE(review): 883 also appears as model.num_nodes and model.n_multiv;
  # presumably all three must agree -- confirm.
  num_nodes: 883
  steps_per_day: 288
  test_ratio: 0.2
  val_ratio: 0.2

model:
  batch_size: 16
  d_inner: 256
  d_k: 16
  d_model: 128
  d_v: 16
  drop_prob: 0.1
  input_dim: 1
  local: 3
  n_head: 4
  n_kernels: 32
  n_layers: 3
  n_multiv: 883
  num_nodes: 883
  output_dim: 1
  w_kernel: 1
  # NOTE(review): same value as data.lag (12); presumably the input window
  # length -- confirm before changing one without the other.
  window: 12

train:
  batch_size: 16
  debug: false
  early_stop: true
  early_stop_patience: 15
  epochs: 300
  grad_norm: false
  log_step: 200
  loss_func: mae
  lr_decay: false
  lr_decay_rate: 0.3
  # Kept as a comma-separated string (quoted to make the string type
  # explicit); presumably split into integers by the consumer -- confirm.
  lr_decay_step: '5,20,40,70'
  lr_init: 0.003
  mae_thresh: 0.0
  mape_thresh: 0.0
  max_grad_norm: 5
  output_dim: 1
  plot: false
  real_value: true
  weight_decay: 0