model: target: Models.interpretable_diffusion.gaussian_diffusion.Diffusion_TS params: seq_length: 160 feature_size: 5 n_layer_enc: 1 n_layer_dec: 2 d_model: 64 # 4 X 16 timesteps: 200 sampling_timesteps: 200 loss_type: 'l1' beta_schedule: 'cosine' n_heads: 4 mlp_hidden_times: 4 attn_pd: 0.1 resid_pd: 0.1 kernel_size: 5 padding_size: 2 solver: base_lr: 1.0e-5 max_epochs: 1000 results_folder: ./Checkpoints_syn gradient_accumulate_every: 2 save_cycle: 100 # max_epochs // 10 ema: decay: 0.99 update_interval: 10 scheduler: target: engine.lr_sch.ReduceLROnPlateauWithWarmup params: factor: 0.5 patience: 200 min_lr: 1.0e-5 threshold: 1.0e-1 threshold_mode: rel warmup_lr: 8.0e-4 warmup: 100 verbose: False