Merge pull request #2470 from makermelissa/main

makermelissa · web-flow · commit 2d124d1582e5 · 2023-04-04T08:00:13.000-07:00
Add ability to specify the audio output device for ChatGPT Bear, and exit early with a message when the required environment variables are not set
diff --git a/ChatGPT_Bear/assistant.py b/ChatGPT_Bear/assistant.py
@@ -4,6 +4,7 @@
 
 import threading
 import os
+import sys
 
 from datetime import datetime, timedelta
 from queue import Queue
@@ -29,6 +30,7 @@
 
 # Azure Parameters
 AZURE_SPEECH_VOICE = "en-GB-OliverNeural"
+DEVICE_ID = None
 
 # Speech Recognition Parameters
 ENERGY_THRESHOLD = 1000  # Energy level for mic to detect
@@ -47,6 +49,12 @@
 speech_key = os.environ.get("SPEECH_KEY")
 service_region = os.environ.get("SPEECH_REGION")
 
+if openai.api_key is None or speech_key is None or service_region is None:
+    print(
+        "Please set the OPENAI_API_KEY, SPEECH_KEY, and SPEECH_REGION environment variables first."
+    )
+    sys.exit(1)
+
 speech_config = speechsdk.SpeechConfig(subscription=speech_key, region=service_region)
 speech_config.speech_synthesis_voice_name = AZURE_SPEECH_VOICE
 
@@ -157,10 +165,14 @@ def __init__(self, azure_speech_config):
         self.do_mouth_movement = False
         self._mouth_thread = threading.Thread(target=self.move_mouth, daemon=True)
         self._mouth_thread.start()
-
+        if DEVICE_ID is None:
+            audio_config = speechsdk.audio.AudioOutputConfig(use_default_speaker=True)
+        else:
+            audio_config = speechsdk.audio.AudioOutputConfig(device_name=DEVICE_ID)
         self._speech_synthesizer = speechsdk.SpeechSynthesizer(
-            speech_config=azure_speech_config
+            speech_config=azure_speech_config, audio_config=audio_config
         )
+
         self._speech_synthesizer.synthesizing.connect(self.start_moving_mouth)
         self._speech_synthesizer.synthesis_completed.connect(self.stop_moving_mouth)