-
Notifications
You must be signed in to change notification settings - Fork 0
/
gptinterface_V1.1_GUI_Refactored.py
234 lines (187 loc) · 8.67 KB
/
gptinterface_V1.1_GUI_Refactored.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
import os
import re
import subprocess
import threading
import tkinter as tk
import wave
from time import sleep
from tkinter import scrolledtext

import openai
import pyaudio
import pyttsx3
import speech_recognition as sr
# Read the API key from the OPENAI_API_KEY environment variable so the secret
# does not have to be written into this file. When the variable is unset the
# value falls back to the empty placeholder this script has always used.
openai.api_key = os.environ.get("OPENAI_API_KEY", "")
# Change this to the GPT-3.5 Turbo model you want to use
model_engine = "gpt-3.5-turbo"
class GUI:
    """Tkinter window for JAMES, a voice-driven ChatGPT assistant.

    Pressing the button records microphone audio to ``recording.wav``;
    pressing it again stops the recording, transcribes it, sends the text to
    the chat model, shows and speaks the reply, and runs any commands the
    reply contains (text wrapped in ``*...*``) through the system shell.

    Constructing an instance builds the window and blocks in the Tk main loop
    until the window is closed.
    """

    # Horizontal rule drawn between conversation entries.
    _SEPARATOR = "\n--------------------------------------------------------------------------------------------"

    # A command is the text between two asterisks. The prompt asks the model
    # to wrap commands as `*cmd*`, so an adjacent backtick on either side is
    # treated as part of the wrapper.
    _COMMAND_PATTERN = re.compile(r"`?\*([^*]*)\*`?")

    # Instructions prepended to every user prompt.
    _INSTRUCTIONS = (
        "You have to strictly follow these instructions while generating a "
        "response : 1) Response should be as concise and short as possible "
        "2) When asked to perform a task which can be done using windows "
        "command prompt, Only respond with the commands required to do so "
        "and nothing else. Each command should start with `* and end with "
        "*` and should not contain any new lines or quotes. Generated "
        "commands will be executed on users computer and output if any "
        "will be given to you by user. If given, use that output to inform "
        "user about status of completion of given task else assume the "
        "task to be completed and inform the user. For all other prompts "
        "respond as you would normally. Prompt : "
    )

    _ERROR_PREFIX = (
        'Error occured while converting speech to text and executing the '
        'command. More info : '
    )

    def __init__(self):
        """Build the window, set up audio state and run the Tk main loop."""
        self.root = tk.Tk()
        self.root.title("JAMES: AI Personal Assistant")
        self.root.geometry("500x600")

        # Create UI elements
        self.conversation = scrolledtext.ScrolledText(self.root, wrap="word")
        self.conversation.configure(
            font=("Calibri", 12), bg="#F7F7F7", fg="#000000", padx=10, pady=10)
        self.conversation.pack(side="top", fill="both", expand=True)

        # Configure the tags used to align user (right) and GPT (left) text
        self.conversation.tag_config("right", justify='right')
        self.conversation.tag_config("left", justify='left')

        self.speak_button = tk.Button(
            self.root, text="Speak", command=self.toggle_recording)
        self.speak_button.configure(
            font=("Arial", 14), bg="#4CAF50", fg="#FFFFFF")
        self.speak_button.pack(side="bottom", pady=10)

        # Recording related
        self.recording = False
        self.frames = []
        self.chunk = 1024
        self.format = pyaudio.paInt16
        self.channels = 1
        self.rate = 44100
        self.filename = "recording.wav"
        self.p = pyaudio.PyAudio()
        self.stream = None
        self.event = threading.Event()  # set => recorder thread must stop
        self._record_thread = None

        self.conversationHistory = [
            {"role": "system", "content": "You are JAMES, an AI personal assistant"}]
        self.first_Prompt = True

        try:
            self.root.mainloop()
        finally:
            # Closing the window mid-recording must not leave the recorder
            # running or the audio device open.
            self._halt_capture()
            self.p.terminate()

    def toggle_recording(self):
        """Button callback: start recording, or stop and process the audio."""
        if self.recording:
            self.recording = False
            self.stop_recording()
            self.speak_button.configure(
                text="Speak", font=("Arial", 14), bg="#4CAF50", fg="#FFFFFF")
        else:
            # Flip the flag only after the device opened successfully, so a
            # failed start leaves the button in its idle state.
            self.start_recording()
            self.recording = True
            self.speak_button.configure(
                text="Stop", font=("Arial", 14), bg="#FF0000", fg="#FFFFFF")

    def start_recording(self):
        """Open the input stream and start the background recorder thread."""
        self.frames = []
        self.stream = self.p.open(format=self.format,
                                  channels=self.channels,
                                  rate=self.rate,
                                  input=True,
                                  frames_per_buffer=self.chunk)
        self.event.clear()
        self._record_thread = threading.Thread(
            target=self.record_frames, daemon=True)
        self._record_thread.start()

    def stop_recording(self):
        """Stop capturing, save the WAV file and process it in a worker thread.

        Failures are reported on stdout rather than raised.
        """
        try:
            self._halt_capture()
            self.save_recording()
        except Exception as e:
            print(self._ERROR_PREFIX + str(e))
            return
        # Transcription and the chat round-trip are blocking calls; keep them
        # off the Tk thread so the window stays responsive.
        threading.Thread(target=self._transcribe_and_converse).start()

    def _halt_capture(self):
        """Stop the recorder thread, then stop and close the input stream."""
        # Signal first and wait for the thread, so it never reads from a
        # stream that has already been stopped and all frames are collected
        # before the file is written.
        self.event.set()
        recorder = self._record_thread
        if recorder is not None:
            recorder.join()
            self._record_thread = None
        if self.stream is not None:
            self.stream.stop_stream()
            self.stream.close()
            self.stream = None

    def _transcribe_and_converse(self):
        """Worker: transcribe the saved recording and run one conversation turn."""
        try:
            self.convert_to_text()
            self.converse_with_chatgpt()
        except Exception as e:
            # Top-level boundary of the worker thread: report and give up on
            # this turn instead of dying with an unhandled traceback.
            print(self._ERROR_PREFIX + str(e))

    def record_frames(self):
        """Append audio chunks to ``self.frames`` until ``self.event`` is set."""
        while not self.event.is_set():
            # An input overflow should drop audio, not abort the recording.
            data = self.stream.read(self.chunk, exception_on_overflow=False)
            self.frames.append(data)

    def save_recording(self):
        """Write the captured frames to ``self.filename`` as a WAV file."""
        with wave.open(self.filename, 'wb') as wf:
            wf.setnchannels(self.channels)
            wf.setsampwidth(self.p.get_sample_size(self.format))
            wf.setframerate(self.rate)
            wf.writeframes(b''.join(self.frames))

    def remove_code_from_response(self):
        """Return ``self.answer`` with every ``*...*`` command span removed.

        A backtick directly adjacent to the span is removed with it. The
        filtered text is also printed to stdout.
        """
        temp_answer = self._COMMAND_PATTERN.sub("", str(self.answer))
        print("filtered response: " + temp_answer)
        return temp_answer

    def get_commands_from_response(self):
        """Store in ``self.commands`` the commands found in ``self.answer``.

        Commands are the texts between successive pairs of asterisks, scanned
        left to right. Surrounding whitespace is trimmed and blank entries
        (e.g. from ``**``) are dropped so they are never sent to the shell.
        """
        found = self._COMMAND_PATTERN.findall(str(self.answer))
        self.commands = [cmd.strip() for cmd in found if cmd.strip()]

    def execute_commands_in_cmd_window_and_get_output(self):
        """Run ``self.commands`` in one shell call; store output in ``self.cmdoutput``.

        The commands are joined with ``" & "``; stdout and stderr are captured
        together. ``self.cmdoutput`` is ``""`` when nothing was printed.
        """
        self.cmdoutput = ""
        # SECURITY: these commands come straight from the model's reply and
        # are executed through the shell without review or sandboxing.
        process = subprocess.run(
            ' & '.join(self.commands), shell=True,
            stdout=subprocess.PIPE, stderr=subprocess.STDOUT)
        # Console output is not guaranteed to be UTF-8; undecodable bytes are
        # replaced instead of raising UnicodeDecodeError.
        output = process.stdout.decode('utf-8', errors='replace')
        if output:
            self.cmdoutput = output
            print("Generated output: " + self.cmdoutput)

    def get_gpt_response_for_conversation(self):
        """Send the conversation history to the model; store the reply in ``self.answer``."""
        response = openai.ChatCompletion.create(
            model=model_engine,
            messages=self.conversationHistory,
            max_tokens=512,
            temperature=0.2
        )
        self.answer = response['choices'][0]['message']['content']

    def _append_entry(self, text, tag, with_separator=True):
        """Insert ``text`` with ``tag`` at the end of the log and scroll to it."""
        # NOTE(review): the gui_print_* methods are called from the worker
        # thread; confirm the Tk build in use tolerates widget calls from
        # outside the main thread.
        if with_separator:
            self.conversation.insert(tk.END, self._SEPARATOR, "left")
        self.conversation.insert(tk.END, text, tag)
        self.conversation.see(tk.END)

    def gui_print_user_first_prompt(self):
        """Show the user's prompt; the very first one has no separator above it."""
        needs_separator = not self.first_Prompt
        self.first_Prompt = False
        self._append_entry("\nUser : " + self.text, "right", needs_separator)

    def gui_print_gpt_first_response(self):
        """Show the current model reply (``self.answer``) under a separator."""
        self._append_entry("\nGPT: " + self.answer, "left")

    def gui_print_cmd_first_response(self):
        """Show the captured command output (``self.cmdoutput``) under a separator."""
        self._append_entry("\nCMD OUTPUT: " + self.cmdoutput, "right")

    def convert_to_text(self):
        """Transcribe the saved recording into ``self.text``."""
        r = sr.Recognizer()
        with sr.AudioFile(self.filename) as source:
            audio_data = r.record(source)
        # Speech to text
        self.text = r.recognize_google(audio_data)

    def converse_with_chatgpt(self):
        """Run one conversation turn for ``self.text``.

        Sends the prompt, shows and speaks the reply, and, when the reply
        contains commands, executes them, feeds the output back to the model
        and shows and speaks the follow-up reply. Commands in the follow-up
        reply are stripped from the spoken text but not executed.
        """
        # Initialize Text to speech
        engine = pyttsx3.init()

        # AI instructions and user prompt
        self.conversationHistory.append(
            {"role": "user", "content": self._INSTRUCTIONS + self.text})
        self.gui_print_user_first_prompt()

        # First reply
        self.get_gpt_response_for_conversation()
        self.conversationHistory.append(
            {"role": "assistant", "content": self.answer})
        self.gui_print_gpt_first_response()
        self.get_commands_from_response()
        engine.say(self.remove_code_from_response())

        if self.commands:
            # Execute the commands and hand their output back to the model
            self.execute_commands_in_cmd_window_and_get_output()
            self.conversationHistory.append(
                {"role": "user", "content": "CMD OUTPUT: " + self.cmdoutput})
            self.gui_print_cmd_first_response()

            # Follow-up reply
            self.get_gpt_response_for_conversation()
            self.conversationHistory.append(
                {"role": "assistant", "content": self.answer})
            self.gui_print_gpt_first_response()
            # Strip (but do not run) any commands from the spoken follow-up
            self.get_commands_from_response()
            engine.say(self.remove_code_from_response())

        engine.runAndWait()
# Script entry point: constructing GUI builds the window and runs its main
# loop, so nothing else is needed here.
if __name__ == "__main__":
    GUI()