Spaces:
Running
Running
File size: 1,762 Bytes
59ef847 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 |
"""
Flask web demo for phonikud-tts: adds diacritics to text, phonemizes it and
synthesizes speech that is returned to the browser as a WAV data URI.

Setup and run:

uv sync
uv pip install Flask
wget https://huggingface.co/thewh1teagle/phonikud-onnx/resolve/main/phonikud-1.0.int8.onnx
wget https://huggingface.co/thewh1teagle/phonikud-tts-checkpoints/resolve/main/model.onnx
wget https://huggingface.co/thewh1teagle/phonikud-tts-checkpoints/resolve/main/model.config.json
uv run ./examples/space_v1/app.py
"""
from flask import Flask, render_template, request, jsonify
from phonikud_tts import Phonikud, phonemize, Piper
import soundfile as sf
import base64
import io
# Application object; the route decorators below register their views on it.
app = Flask(__name__)
# The model objects are built once at import time and shared by all requests.
# The paths are relative to the working directory and name the files fetched
# by the wget commands in the module docstring.
phonikud = Phonikud("phonikud-1.0.int8.onnx")
piper = Piper("model.onnx", "model.config.json")
@app.route("/")
def index():
    """Serve the landing page by rendering the ``index.html`` template."""
    page = render_template("index.html")
    return page
@app.route("/generate", methods=["POST"])
def generate():
    """Synthesize speech for the submitted form and return the result as JSON.

    Form fields:
        mode: ``"text"`` (diacritics are added to ``text`` before it is
            phonemized) or ``"diacritics"`` (``text`` is phonemized as-is).
            Any other value uses the ``phonemes`` field directly.
        text: input for the ``"text"`` and ``"diacritics"`` modes.
        phonemes: input for every other mode.

    Returns:
        A JSON object with ``diacritics`` (``None`` when phonemes were
        supplied directly), ``phonemes`` and ``audio`` (a base64-encoded
        WAV ``data:`` URI). If the field used by the selected mode is
        blank, a JSON object with an ``error`` message and HTTP status 400
        is returned instead.
    """
    # Indexing (rather than .get) is deliberate: a missing "mode" field makes
    # Flask answer with 400 Bad Request.
    mode = request.form["mode"]
    text = request.form.get("text", "")
    phonemes = request.form.get("phonemes", "")

    # Reject blank input up front instead of handing an empty string to the
    # models and the synthesizer.
    uses_text = mode in ("text", "diacritics")
    required_field = "text" if uses_text else "phonemes"
    required_value = text if uses_text else phonemes
    if not required_value.strip():
        return jsonify({"error": f"'{required_field}' must not be empty"}), 400

    if mode == "text":
        with_diacritics = phonikud.add_diacritics(text)
        phonemes = phonemize(with_diacritics)
    elif mode == "diacritics":
        with_diacritics = text
        phonemes = phonemize(with_diacritics)
    else:
        # Phonemes were supplied by the client; there is no diacritized text.
        with_diacritics = None

    samples, sample_rate = piper.create(
        phonemes, is_phonemes=True, length_scale=1.25
    )

    # Encode the audio in memory so it can be embedded in the JSON response.
    buffer = io.BytesIO()
    sf.write(buffer, samples, sample_rate, format="WAV")
    b64_audio = base64.b64encode(buffer.getvalue()).decode("utf-8")
    data_uri = f"data:audio/wav;base64,{b64_audio}"

    return jsonify({
        "diacritics": with_diacritics,
        "phonemes": phonemes,
        "audio": data_uri,
    })
@app.route("/audio/<filename>")
def serve_audio(filename):
    """Return the file called *filename* from the application's static folder."""
    static_file_response = app.send_static_file(filename)
    return static_file_response
if __name__ == "__main__":
    import os

    # The server listens on every interface (0.0.0.0). The Werkzeug debugger
    # lets a client execute arbitrary code, so it must not be on by default;
    # opt in explicitly with FLASK_DEBUG=1 for local development.
    debug = os.environ.get("FLASK_DEBUG", "").lower() in {"1", "true", "yes", "on"}
    app.run(debug=debug, host="0.0.0.0", port=7860)
|