Fix speech blocking the main thread

2025-12-18 22:44:21 +01:00 · 2023-04-05 15:50:28 +02:00
parent 62dfd84599
commit 73bf928c1d
2 changed files with 23 additions and 14 deletions
--- a/requirements.txt
+++ b/requirements.txt
@@ -1,7 +1,7 @@
 beautifulsoup4
 colorama==0.4.6
 openai==0.27.2
-playsound==1.3.0
+playsound==1.2.2
 python-dotenv==1.0.0
 pyyaml==6.0
 readability-lxml==0.8.1
--- a/scripts/speak.py
+++ b/scripts/speak.py
@@ -4,6 +4,8 @@ import requests
 from config import Config
 cfg = Config()
 import gtts
 import threading
 from threading import Lock
 # TODO: Nicer names for these ids
@@ -14,17 +16,20 @@ tts_headers = {
    "xi-api-key": cfg.elevenlabs_api_key
 }
 mutex_lock = Lock() # Ensure only one sound is played at a time
 def eleven_labs_speech(text, voice_index=0):
    tts_url = "https://api.elevenlabs.io/v1/text-to-speech/{voice_id}".format(
        voice_id=voices[voice_index])
-    formatted_message = {"text": text}
+    formatted_message = {"text": text, "voice_settings": {"stability": 0.05, "similarity_boost": 0.8}}
    response = requests.post(
        tts_url, headers=tts_headers, json=formatted_message)
    if response.status_code == 200:
        with mutex_lock:
            with open("speech.mpeg", "wb") as f:
                f.write(response.content)
-        playsound("speech.mpeg")
+            playsound("speech.mpeg", True)
            os.remove("speech.mpeg")
        return True
    else:
@@ -34,11 +39,13 @@ def eleven_labs_speech(text, voice_index=0):
 def gtts_speech(text):
    tts = gtts.gTTS(text)
    with mutex_lock:
        tts.save("speech.mp3")
-    playsound("speech.mp3")
+        playsound("speech.mp3", True)
        os.remove("speech.mp3")
 def say_text(text, voice_index=0):
    def speak():
        if not cfg.elevenlabs_api_key:
            gtts_speech(text)
        else:
@@ -46,3 +53,5 @@ def say_text(text, voice_index=0):
            if not success:
                gtts_speech(text)
    thread = threading.Thread(target=speak)
    thread.start()