---
# Training configuration: model architecture/diffusion hyperparameters and
# solver (optimisation, checkpointing, EMA, LR schedule) settings.
#
# NOTE(review): this file was restored from a single collapsed line. The
# nesting below (in particular `ema` and `scheduler` under `solver`) is
# reconstructed from key order -- confirm against the code that reads it.

model:
  # Dotted path of the model class to instantiate; `params` holds its settings.
  target: Models.interpretable_diffusion.gaussian_diffusion.Diffusion_TS
  params:
    seq_length: 192
    feature_size: 137
    n_layer_enc: 4
    n_layer_dec: 4
    d_model: 96  # 4 X 24
    timesteps: 500
    # Same value as `timesteps` above.
    sampling_timesteps: 500
    loss_type: 'l1'
    beta_schedule: 'cosine'
    n_heads: 4
    mlp_hidden_times: 4
    attn_pd: 0.5
    resid_pd: 0.5
    kernel_size: 1
    padding_size: 0

solver:
  base_lr: 1.0e-5
  max_epochs: 1000
  results_folder: ./Checkpoints_solar_nips
  gradient_accumulate_every: 2
  save_cycle: 100  # max_epochs // 10

  ema:
    decay: 0.9
    update_interval: 10

  scheduler:
    # Dotted path of the LR scheduler class; `params` holds its settings.
    target: engine.lr_sch.ReduceLROnPlateauWithWarmup
    params:
      factor: 0.5
      patience: 300
      # NOTE(review): equal to `solver.base_lr` (1.0e-5); `warmup_lr` is higher.
      min_lr: 1.0e-5
      threshold: 1.0e-1
      threshold_mode: rel
      warmup_lr: 8.0e-4
      warmup: 100
      verbose: false