{ "activation_function": "gelu", "architectures": [ "PatchTSTForPrediction" ], "attention_dropout": 0.0, "bias": true, "channel_attention": true, "channel_consistent_masking": false, "channel_rope": false, "context_length": 512, "d_model": 512, "distribution_output": null, "do_mask_input": false, "dropout": 0.0, "ff_dropout": 0.0, "ffn_dim": 512, "head_dropout": 0.0, "huber_delta": 1.0, "init_std": 0.02, "loss": "mse", "mask_type": "random", "mask_value": 0, "max_wavelength": 500, "mode": "predict", "model_type": "patchtst", "norm_eps": 1e-05, "norm_type": "rmsnorm", "num_attention_heads": 8, "num_forecast_mask_patches": 3, "num_hidden_layers": 8, "num_input_channels": 1, "num_parallel_samples": 100, "num_poly_feats": 120, "num_rff": 256, "num_targets": 1, "output_range": null, "patch_length": 16, "patch_stride": 16, "path_dropout": 0.0, "poly_degrees": 2, "pooling_type": "mean", "positional_dropout": 0.0, "positional_encoding_type": "sincos", "pre_norm": true, "prediction_length": 128, "pretrained_encoder_path": null, "random_mask_ratio": 0.5, "rff_scale": 1.0, "rff_trainable": false, "rope_percent": 0.75, "scaling": "std", "share_embedding": true, "share_projection": true, "torch_dtype": "float32", "transformers_version": "4.40.1", "unmasked_channel_indices": null, "use_cls_token": false, "use_dynamics_embedding": true }