{ "dim_feedforward": 512, "hidden_dim": 128, "max_audio_seconds": 600, "nhead": 8, "num_layers": 2, "output_dim": 3 }