-
Notifications
You must be signed in to change notification settings - Fork 6
/
Copy pathChatGPT_voice.py
129 lines (105 loc) · 3.35 KB
/
ChatGPT_voice.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
import os
import sys
import time
import openai
import pyaudio
import logging
import speech_recognition as sr
from gtts import gTTS
from functools import wraps
from pydub import AudioSegment
from pydub.playback import play
# Prompt that is spoken aloud and written to the log at the start of every
# round of the voice loop in voice_ChatGPT().
how_can_I_help = 'How can I help'
def handle_exception(func):
    """Wrap *func* so that any ``Exception`` it raises is logged and ends the program.

    The returned callable forwards all positional and keyword arguments to
    *func* and hands back its return value. If *func* raises an ``Exception``,
    the error is logged together with its traceback and the process exits
    with status 1 through ``sys.exit``.
    """
    def guarded(*args, **kwargs):
        try:
            outcome = func(*args, **kwargs)
        except Exception as e:
            logging.error("Error: %s", e, exc_info=True)
            sys.exit(1)
        else:
            return outcome

    # Carry over the wrapped function's name, docstring and other metadata.
    return wraps(func)(guarded)
@handle_exception
def check_audio_devices():
    """Verify that default audio input and output devices are available.

    Looks up the default input and output devices through PyAudio and logs
    their names. If either lookup yields no device, an error is logged and
    the process exits with status 1. Any exception raised by the lookup is
    handled by the ``handle_exception`` decorator, which also exits.

    The PyAudio instance is only needed for the lookup, so it is terminated
    as soon as the device information has been read.
    """
    p = pyaudio.PyAudio()
    try:
        input_device = p.get_default_input_device_info()
        output_device = p.get_default_output_device_info()
    finally:
        # Always release the PortAudio session, even when a lookup raises;
        # the original never called terminate() and leaked the instance.
        p.terminate()

    if input_device is None:
        logging.error("No audio input device found.")
        sys.exit(1)
    if output_device is None:
        logging.error("No audio output device found.")
        sys.exit(1)

    logging.info("Audio input device: %s", input_device['name'])
    logging.info("Audio output device: %s", output_device['name'])
@handle_exception
def voice_ChatGPT():
    """Run the voice-driven chat loop until the user confirms an exit command.

    Each round speaks a prompt, records a spoken command from the microphone,
    transcribes it with Google speech recognition, sends it to the OpenAI
    completion endpoint and speaks the answer. Saying "goodbye", "exit" or
    "end program" and then confirming with "yes" ends the loop.

    Logging is written to a timestamped file in the current directory. The
    root logger is held at INFO while the loop runs and is put back to DEBUG
    once the loop has finished.

    Returns:
        The name of the log file, or ``None`` when the ``OPENAI_API_KEY``
        environment variable is not set (the loop is never started then).
    """
    log_file = f"_{sys._getframe().f_code.co_name}_{time.strftime('%Y%m%d-%H%M%S')}.log"
    logging.basicConfig(filename=log_file,
                        level=logging.DEBUG,
                        format='%(asctime)s %(levelname)s %(message)s',
                        datefmt='%Y-%m-%d %H:%M:%S')

    # Keep the log at INFO and above for the duration of the conversation loop.
    root_logger = logging.getLogger()
    root_logger.setLevel(logging.INFO)

    check_audio_devices()

    # Initialize the speech recognizer and microphone
    recognizer = sr.Recognizer()
    microphone = sr.Microphone()

    openai.api_key = os.getenv("OPENAI_API_KEY")
    if openai.api_key is None:
        logging.error("API key not found.")
        return

    exit_commands = ("goodbye", "exit", "end program")

    try:
        while True:
            try:
                # Prompt the user for voice input
                text_to_speech(how_can_I_help)
                logging.info(how_can_I_help)
                with microphone as source:
                    audio = recognizer.listen(source)

                # Convert the audio to text
                command = recognizer.recognize_google(audio, language="en-US")
                logging.info("Command: %s", command)

                if command.lower() in exit_commands:
                    text_to_speech("Are you sure? to exit say yes")
                    with microphone as source:
                        audio = recognizer.listen(source)
                    confirmation = recognizer.recognize_google(audio, language="en-US")
                    if confirmation.lower() == 'yes':
                        logging.info("Goodbye!")
                        break
                    # Exit was not confirmed: start a new round instead of
                    # forwarding the exit word to OpenAI as a prompt.
                    continue

                # Generate the response from OpenAI
                response = openai.Completion.create(
                    engine="text-davinci-002",
                    prompt='You said: ' + command,
                    max_tokens=2048,
                    n=1,
                    stop=None,
                    temperature=0.5
                )
                response = response.choices[0].text
                logging.info("Response: %s", response)
                text_to_speech(response)
            except sr.UnknownValueError:
                logging.error("Sorry, I did not understand what you said.")
            except sr.RequestError as e:
                logging.error("Error while requesting results: %s", e)
    finally:
        # Restore the level once, after the loop. Doing this per iteration
        # (as before) switched the log back to DEBUG after the first round.
        root_logger.setLevel(logging.DEBUG)

    return log_file
@handle_exception
def text_to_speech(text):
    """Speak *text* aloud through the default audio output.

    The text is synthesized with gTTS (English), written to a temporary MP3
    file in the current directory, decoded with pydub and played. The
    temporary file is removed once the audio has been loaded into memory.

    Args:
        text: The text to speak. Empty or whitespace-only text is skipped
            with a warning, because gTTS rejects it and the resulting
            exception would make the decorator terminate the program.
    """
    if not text or not text.strip():
        logging.warning("Nothing to speak; skipping text-to-speech.")
        return

    tmp_path = "tmp.mp3"
    try:
        tts = gTTS(text=text, lang='en')
        tts.save(tmp_path)
        audio = AudioSegment.from_file(tmp_path)
    finally:
        # Do not leave the intermediate file behind in the working directory.
        try:
            os.remove(tmp_path)
        except OSError:
            # The file was never created or cannot be removed; not fatal.
            logging.debug("Could not remove temporary file %s", tmp_path)

    play(audio)
if __name__ == '__main__':
    # Run the assistant, then delete the log file it reports back.
    log_file = voice_ChatGPT()
    if log_file is None:
        # voice_ChatGPT() returns None when it stops before the chat loop
        # (missing API key); os.path.exists(None) would raise TypeError.
        print("voice_ChatGPT() returned no log file name; nothing to clean up")
    elif os.path.exists(log_file):
        os.remove(log_file)
    else:
        print(f"{log_file} file does not exist")