diff --git a/xinference/model/audio/core.py b/xinference/model/audio/core.py index b5ad532b6a..39d87df956 100644 --- a/xinference/model/audio/core.py +++ b/xinference/model/audio/core.py @@ -25,9 +25,9 @@ from .f5tts_mlx import F5TTSMLXModel from .fish_speech import FishSpeechModel from .funasr import FunASRModel +from .melotts import MeloTTSModel from .whisper import WhisperModel from .whisper_mlx import WhisperMLXModel -from .melotts import MeloTTSModel logger = logging.getLogger(__name__) diff --git a/xinference/model/audio/melotts.py b/xinference/model/audio/melotts.py index 06282cb992..bf1126fc76 100644 --- a/xinference/model/audio/melotts.py +++ b/xinference/model/audio/melotts.py @@ -53,6 +53,7 @@ def load(self): import os import sys + import nltk # English language requires download averaged_perceptron_tagger_eng