{
  "activation_dropout": 0.1,
  "activation_function": "gelu",
  "architectures": [
    "TimeSeriesTransformerForPrediction"
  ],
  "attention_dropout": 0.1,
  "cardinality": [
    366
  ],
  "context_length": 60,
  "d_model": 32,
  "decoder_attention_heads": 2,
  "decoder_ffn_dim": 32,
  "decoder_layerdrop": 0.1,
  "decoder_layers": 4,
  "distribution_output": "student_t",
  "dropout": 0.1,
  "embedding_dimension": [
    4
  ],
  "encoder_attention_heads": 2,
  "encoder_ffn_dim": 32,
  "encoder_layerdrop": 0.1,
  "encoder_layers": 4,
  "feature_size": 40,
  "init_std": 0.02,
  "input_size": 1,
  "is_encoder_decoder": true,
  "lags_sequence": [
    1,
    2,
    3,
    4,
    5,
    6,
    7,
    8,
    13,
    14,
    15,
    20,
    21,
    22,
    27,
    28,
    29,
    30,
    31,
    56,
    84,
    363,
    364,
    365,
    727,
    728,
    729,
    1091,
    1092,
    1093
  ],
  "loss": "nll",
  "model_type": "time_series_transformer",
  "num_dynamic_real_features": 0,
  "num_parallel_samples": 100,
  "num_static_categorical_features": 1,
  "num_static_real_features": 0,
  "num_time_features": 4,
  "prediction_length": 30,
  "scaling": "mean",
  "torch_dtype": "float32",
  "transformers_version": "4.28.0",
  "use_cache": true
}