{
  "model_type":"vits",
  "auto_map": {
    "AutoModel": "modeling_vits.ModVitsModel"
  },
  "sampling_rate": 24000,
  "speaker_embedding_size": 256,
  "vocab_size": 1260,
  "speaker_names":["Assamese-Female", "Assamese-Male", "Bengali-Female", "Bengali-Male", "Bodo-Female", "Bodo-Male", "Dogri-Female", "Dogri-Male", "Kannada-Female", "Kannada-Male", "Maithili-Male", "Malayalam-Female", "Marathi-Female", "Marathi-Male", "Nepali-Female", "Punjabi-Female", "Punjabi-Male", "Sanskrit-Male", "Tamil-Female", "Telugu-Female"],
  "emotion_names":["ALEXA", "ANGER", "BB", "BOOK", "CONV", "DIGI", "DISGUST", "FEAR", "HAPPY", "NEWS", "SAD", "SURPRISE", "UMANG", "WIKI"],
  "undefined_emotion_index":[9,11,13]
}