---
# Experiment configuration, grouped into four sections:
# basic, data, model, train.
# Restored to block style: the single-line form is not loadable YAML
# (nested "key: value" pairs cannot appear inside a plain scalar).

basic:
  dataset: BJTaxi-OutFlow
  # Quoted so the embedded ':' can never be misread by a parser.
  device: 'cuda:0'
  mode: train
  model: DSANET
  seed: 2023

data:
  # NOTE(review): batch_size is 32 here and under `train`, but 64 under
  # `model` -- confirm which one the consumer actually reads.
  batch_size: 32
  column_wise: false
  days_per_week: 7
  horizon: 24
  input_dim: 1
  lag: 24
  normalizer: std
  num_nodes: 1024
  steps_per_day: 48
  test_ratio: 0.2
  val_ratio: 0.2

model:
  # NOTE(review): differs from data.batch_size / train.batch_size (32).
  batch_size: 64
  d_inner: 2048
  d_k: 64
  d_model: 512
  d_v: 64
  drop_prob: 0.1
  input_dim: 1
  local: 3
  n_head: 8
  n_kernels: 32
  n_layers: 6
  # Same value as num_nodes (1024) in this file.
  n_multiv: 1024
  num_nodes: 1024
  output_dim: 1
  w_kernel: 1
  # Same value as data.lag (24) in this file.
  window: 24

train:
  batch_size: 32
  debug: false
  early_stop: true
  early_stop_patience: 15
  epochs: 300
  # grad_norm is false; presumably max_grad_norm below is then unused --
  # verify against the training code.
  grad_norm: false
  log_step: 200
  loss_func: mae
  # lr_decay is false; presumably lr_decay_rate / lr_decay_step are then
  # unused -- verify against the training code.
  lr_decay: false
  lr_decay_rate: 0.3
  # Comma-separated string, quoted so its string type is explicit.
  # Presumably split into integer steps by the consumer -- TODO confirm.
  lr_decay_step: '5,20,40,70'
  lr_init: 0.003
  mae_thresh: 0.0
  mape_thresh: 0.0
  max_grad_norm: 5
  output_dim: 1
  plot: false
  real_value: true
  weight_decay: 0