{ "model": { "vocos": { "input_channels": 128, "dim": 1024, "intermediate_dim": 4096, "num_layers": 30, "n_fft": 1920, "hop_size": 480, "padding": "same" } } }