forked from suryanshsk/Python-Voice-Assistant-Suryanshsk
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmain_assistant.py
343 lines (294 loc) · 11.1 KB
/
main_assistant.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
import os
import subprocess
import sys
import logging
import webbrowser
import time
from datetime import datetime
from voice_recognition import recognize_speech
from text_to_speech import speak
from wikipedia_info import search_wikipedia
from weather_info import get_weather
from news_info import get_news
from jokes import tell_joke
from open_app import open_application
from open_files import *
from gemini_info import get_gemini_response
from song_data import SONGS
from website_data import WEBSITES
from collections import defaultdict
from reminderr import *
import threading
import json
from email_sender import send_bulk_email
USER_MAIL, USER_PASS, RECEPTIONISTS = "YOUR_EMAIL", "YOUR_PASSWORD", ["List of receptionists"]
### MAIN
"""
Guidelines for new ability/feature contributions
1. Please create your code into a separate file or a separate function.
2. Define your functions's inputs properly.
3. Add your function's tool name to the following TOOLS list, add a description, inputs and action : ( your function name )
4. list your tool properly in the last prompt in the main function to get inputs from gemini.
%% Please be as specific as possible and describe as good as poosible about your inputs, their formats
%% and the function's intention when to be called to get a proper output.
Thank You.
"""
def recognize_speech(timeout=10):
# Simulate speech recognition
return input("You: ")
def speak(message):
print(f"Assistant: {message}")
def just_Say(msg):
logging.info(msg)
speak(msg)
def abort(message):
global RUNNING
RUNNING = False
print(message)
def openfile(file):
logging.info("openinig....", file)
return open_file(file)
def play_music(song_name=""):
if song_name == "":
response = "Which song would you like to play?"
logging.info(response)
speak(response)
song_name = recognize_speech()
if song_name:
youtube_url = SONGS.get(song_name.lower())
if youtube_url:
response = f"Playing {song_name} in your browser."
logging.info(response)
speak(response)
webbrowser.open(youtube_url)
else:
response = "Song not found in the database."
logging.warning(response)
speak(response)
def open_website(website_name = ""):
if website_name == "":
response = "Which website would you like to open?"
logging.info(response)
speak(response)
website_name = recognize_speech()
if website_name:
website_url = WEBSITES.get(website_name.lower())
if website_url:
response = f"Opening {website_name} in your browser."
logging.info(response)
speak(response)
webbrowser.open(website_url)
else:
response = "Website not found in the database.Searching in google."
logging.warning(response)
speak(response)
from googlesearch import search
webs = search(website_name, advanced=True)
webbrowser.open(list(webs)[0].url)
TOOLS = [
{
'name': 'just_Say',
'description': '',
'inputs': ['msg'],
'action': just_Say
},
{
'name': 'get_news',
'description': 'Get news',
'inputs': [],
'action': get_news
},
{
'name': 'set_reminder',
'description': 'Sets a reminder based on user query.',
'inputs': ['input_text'],
'action': extract_reminder
},
{
'name': 'search_wikipedia',
'description': 'Searches Wikipedia for the given query.',
'inputs': ['query'],
'action': search_wikipedia
},
{
'name': 'get_weather',
'description': 'Fetches the weather information for the specified city.',
'inputs': ['city_name'],
'action': get_weather
},
{
'name': 'tell_joke',
'description': 'Tells a random joke.',
'inputs': [],
'action': tell_joke
},
{
'name': 'play_music',
'description': 'Plays music based on the song name provided.',
'inputs': ['song_name'],
'action': play_music
},
{
'name': 'open_website',
'description': 'Opens a website in the browser.',
'inputs': ['website_name'],
'action': open_website
},
{
'name': 'open_application',
'description': 'Opens an Application',
'inputs': ['app_name'],
'action': open_application
},
{
'name': 'abort',
'description': 'Aborts',
'inputs': ['message'],
'action': abort
},
{
'name': 'openfile',
'description': 'Opens files',
'inputs': ['file'],
'action': openfile
},
]
## MAIN
global REMINDERS
global RUNNING
REMINDERS = defaultdict(list)
# Setup logging
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
def get_greeting():
"""Get the appropriate greeting based on the current time."""
current_hour = datetime.now().hour
if current_hour < 12:
return "Good morning"
elif 12 <= current_hour < 18:
return "Good afternoon"
else:
return "Good evening"
def check_reminders():
global REMINDERS
while RUNNING:
current_time = datetime.now()
# Convert current time to ISO 8601 format
current_time_iso = current_time.isoformat()
if REMINDERS[current_time_iso]:
print("Reminder:", REMINDERS[current_time_iso])
logging.info("Reminder: " + REMINDERS[current_time_iso])
try:
send_bulk_email(USER_MAIL, USER_PASS, RECEPTIONISTS, "Your Assisstant", REMINDERS[current_time_iso])
logging.info("Sent reminder "+str(REMINDERS[current_time_iso])+" to "+str(RECEPTIONISTS))
except:
logging.error("Error sending reminder!")
del REMINDERS[current_time_iso]
time.sleep(10)
reminder_thread = threading.Thread(target=check_reminders)
import json
import logging
# Process the response from Gemini to extract the tool and its inputs
def process_gemini_response(response):
try:
response_data = json.loads(response)
tool_name = response_data['tool']
inputs = response_data['inputs']
return tool_name, inputs
except Exception as e:
logging.error(f"Error processing Gemini AI response: {e}")
return None, None
# Predefined headstart options
HEADSTART_OPTIONS = {
"1": "Get today's weather in New York.",
"2": "Set a reminder for tomorrow's meeting.",
"3": "Tell me a joke.",
"4": "Play some music.",
"5": "Search Wikipedia for Python programming."
}
# Function to display headstart options
def display_headstart_options():
print("Choose a headstart option:")
for key, option in HEADSTART_OPTIONS.items():
print(f"{key}: {option}")
# The main loop to handle user commands
def main():
global RUNNING
global REMINDERS
head_start_not_done = 0
while RUNNING:
logging.info("Listening for command...")
if head_start_not_done < 1:
display_headstart_options() # Display options before listening for commands
head_start_not_done = 1
try:
query = recognize_speech(timeout=10) # Replace with actual speech recognition function
except Exception as e:
logging.error(f"Error recognizing speech: {e}")
speak("Sorry, I didn't catch that.")
continue
if not query:
logging.warning("No command recognized, continuing...")
continue
query = query.lower()
logging.info(f"Recognized command: {query}")
# Check if the query matches any headstart option
if query in HEADSTART_OPTIONS.values() and head_start_not_done == 1:
head_start_not_done += 1
# Map the option to the appropriate command
option_key = next(key for key, option in HEADSTART_OPTIONS.items() if option == query)
query = HEADSTART_OPTIONS[option_key] # Use the selected headstart option
else:
head_start_not_done += 1
# Prompt Gemini AI to select tool and provide inputs
gemini_prompt = f"""
I have a list of tools that can perform specific actions. Based on the user query, select the appropriate tool from the list and extract the necessary inputs. Please respond in the following JSON format:
{{
"tool": "<tool_name>",
"inputs": {{
"input1": "<value1>",
"input2": "<value2>",
...
}}
}}
Here is the list of tools:
1. "just_Say": Requires "msg", a generic conversational response if none of the following tools fits best.
2. "set_reminder": Requires "input_text" (simply return enhanced the input Query which I give).
3. "search_wikipedia": Requires "query".
4. "get_weather": Requires "city_name".
5. "tell_joke": Requires no inputs.
6. "play_music": Requires "song_name".
7. "open_website": Requires "website_name" (return an empty string if no website is specified).
8. "open_application": Requires "app_name".
9. "get_news": Requires no inputs.
10. "openfile": Requires "file" (If path is there, give file name; if there is a location description, please build file path from description).
11. "abort": Requires a "message". Call this if the user wants to leave.
If the tool requires no inputs, leave the "inputs" field empty.
Query: "{query}"
"""
gemini_response = get_gemini_response(gemini_prompt)
tool_name, inputs = process_gemini_response(gemini_response)
print(tool_name, inputs)
if tool_name:
# Find the corresponding tool and call its action with the provided inputs
tool = next((t for t in TOOLS if t['name'] == tool_name), None)
if tool:
try:
tool['action'](**inputs)
except Exception as e:
logging.error(f"Error executing {tool_name}: {e}")
speak(f"Sorry, there was an error with {tool_name}.")
else:
logging.error(f"Tool {tool_name} not found.")
speak(f"Sorry, I couldn't find the tool {tool_name}.")
else:
speak("Sorry, I couldn't process the query.")
if __name__ == "__main__":
RUNNING = True
reminder_thread.start()
response = "Hello, I'm Your PA. How can I assist you today?"
logging.info(response)
speak(response)
try:
main()
except KeyboardInterrupt:
RUNNING = False