vicuna-clip

Running on Zero

ford442 committed on Feb 11

Commit

2dbdb2a

verified ·

1 Parent(s): 97a0fb8

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -33,36 +33,7 @@ def _preload_and_load_models():
 _preload_and_load_models()
-# Load the TTS model locally
-TTS_MODEL_PATH = "path/to/your/espnet/kan-bayashi_ljspeech_vits"  # Replace with the actual path
-TTS_CONFIG_PATH = os.path.join(TTS_MODEL_PATH, "config.yaml") # Replace with your config.yaml
-TTS_VOCAB_PATH = os.path.join(TTS_MODEL_PATH, "train.json") # Replace with your train.json
-# Load the configuration using yaml
-with open(TTS_CONFIG_PATH, "r") as f:
-    config = yaml.safe_load(f)
-# Correctly handle the threshold parameter
-threshold = config.get("threshold", 0.5)  # Get threshold, default to 0.5 if not found
-if isinstance(threshold, str):  # Check if it's a string
-    try:
-        threshold = float(threshold)  # Try converting to float
-    except ValueError:
-        threshold = 0.5  # If conversion fails, use a default value
-tts = Text2Speech(
-    TTS_MODEL_PATH,
-    TTS_CONFIG_PATH,
-    TTS_VOCAB_PATH,
-    device="cuda" if torch.cuda.is_available() else "cpu",
-    threshold=threshold  # Pass the corrected threshold value
-)
-fastspeech_config = get_fastspeech_config(TTS_CONFIG_PATH)
 @spaces.GPU(required=True)
 def process_audio(microphone, state, task="transcribe"):

 _preload_and_load_models()
+tts = Text2Speech.from_pretrained("espnet/kan-bayashi_ljspeech_vits")
 @spaces.GPU(required=True)
 def process_audio(microphone, state, task="transcribe"):