-
Notifications
You must be signed in to change notification settings - Fork 1
/
SpeechRecognizer.py
298 lines (255 loc) · 11.3 KB
/
SpeechRecognizer.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
""" =================================================================
File: SpeechRecognizer.py
This file contains code for the SpeechRecognizer class that can convert
the user's speech into text.
Authors: Anh Nguyen, Lily Irvin, Ryan Specht
Contributors: Emiliano Huerta, James Yang
==================================================================="""
from datetime import datetime
import time
import speech_recognition as sr
import gtts as gTTS
import playsound
import os
import random
import requests
from geopy.geocoders import Nominatim
# imports for grabWeather() method
import requests
import json
#imports for jokes
import pyjokes
import random
class SpeechRecognizer:
    """Voice front end for Kuri: listens, matches a command keyword, speaks a reply.

    Speech-to-text goes through the ``speech_recognition`` recognizer created
    in ``__init__``; text-to-speech goes through gTTS and playsound (see
    ``kuri_speak``).
    """

    # Seconds to wait for any HTTP API before giving up, so a stalled
    # connection cannot hang the assistant forever.
    _REQUEST_TIMEOUT = 10

    # Environment variable that overrides the embedded NewsAPI key.
    _NEWS_API_KEY_ENV = "NEWS_API_KEY"
    # SECURITY NOTE(review): this key is committed to source control. It is
    # kept only as a fallback so existing deployments keep working; it should
    # be rotated and supplied through the environment variable above.
    _FALLBACK_NEWS_API_KEY = "f2977f6aa47c40f2bba4dd1051c5d3f8"

    # (keyword, handler method name), checked in order; the first keyword
    # found in the utterance wins. Handlers are stored by name and resolved
    # with getattr so subclass/instance overrides are honoured.
    _COMMANDS = (
        ("your name", "_say_name"),
        ("what time is it", "_say_time"),
        ("weather", "grabWeather"),
        ("forecast", "grabWeather"),
        ("joke", "grab_joke"),
        ("news", "grabNews"),
        ("sports", "grabSport"),
        ("multiply", "calculateMult"),
        ("divide", "calculateDiv"),
        ("add", "calculateAdd"),
        ("subtract", "calculateSub"),
        # ("tip", "calculateTip"),  # disabled together with calculateTip below
        ("dice", "rollDie"),
        ("flip a coin", "odds"),
        ("goodbye", "_say_goodbye"),
    )

    def __init__(self):
        """Sets up a speech recognizer object"""
        self.recognizer = sr.Recognizer()
        self.recognizer.energy_threshold = 300

    # ------------------------------------------------------------------
    # Speech input / output
    # ------------------------------------------------------------------
    def getSpeech(self):
        """
        Records the user's speech from the microphone and turns it into text.

        Returns:
            str or None: the recognized text, or None when the speech could
            not be understood or the recognition service could not be
            reached (the user is told which via kuri_speak in both cases).
        """
        # Obtains audio from the microphone
        with sr.Microphone() as source:
            self.recognizer.adjust_for_ambient_noise(source, duration=0.5)
            audio = self.recognizer.listen(source)

        # Recognizes speech using Google Speech Recognition. The request is
        # made once and the result reused for both the log line and the
        # return value (it used to be sent twice per utterance).
        try:
            text = self.recognizer.recognize_google(audio)
        except sr.UnknownValueError:
            self.kuri_speak("Sorry, I was unable to process what you said. Please try again")
            return None
        except sr.RequestError:
            self.kuri_speak("Sorry, I am unable to connect to the internet at this moment. Please try again later")
            return None
        print(text)
        return text

    def kuri_speak(self, audio_string):
        """
        Converts a text message to speech with gTTS, plays it, and prints it.

        Args:
            audio_string (string): the sentence Kuri should say out loud
        """
        tts = gTTS.gTTS(text=audio_string, lang='en')
        audio_file = 'audio-' + str(random.randint(1, 100000)) + '.mp3'
        try:
            tts.save(audio_file)
            playsound.playsound(audio_file)
            print(audio_string)
        finally:
            # Always clean up the temporary mp3, even when saving or playback
            # fails, so failed attempts do not litter the working directory.
            if os.path.exists(audio_file):
                os.remove(audio_file)

    # ------------------------------------------------------------------
    # Command interpretation
    # ------------------------------------------------------------------
    def response(self, voice_data):
        """
        Answers the given utterance, then keeps listening and answering.

        The loop is iterative: the previous implementation called itself
        recursively for every new utterance, so the call stack grew with each
        command. The loop runs even when the first utterance is None. It only
        ends when the user says "goodbye" (SystemExit) or an exception
        escapes a handler.

        Args:
            voice_data (string): first utterance to interpret; None (speech
                that was not understood) is skipped and listening continues
        """
        while True:
            if voice_data is not None:
                self._handle_command(voice_data)
            voice_data = self.getSpeech()

    def _handle_command(self, voice_data):
        """Runs the handler of the first known keyword found in voice_data."""
        # Match case-insensitively: the transcript's capitalisation is not
        # under our control.
        command = voice_data.lower()
        for keyword, handler_name in self._COMMANDS:
            if keyword in command:
                getattr(self, handler_name)()
                return
        self.kuri_speak("Sorry, I don't seem to know that command yet")
        self.kuri_speak("Is there anything else I can help you with?")

    def _say_name(self):
        """Tells the user Kuri's name."""
        self.kuri_speak("My name is Kuri")
        self.kuri_speak("is there anything else I can help you with?")

    def _say_time(self):
        """Speaks the current local time as 12-hour HH:MM:SS."""
        self.kuri_speak(datetime.now().strftime("%I:%M:%S"))
        self.kuri_speak("is there anything else I can help you with?")

    def _say_goodbye(self):
        """Says goodbye and terminates the program.

        Raises:
            SystemExit: always. Raised directly instead of calling quit(),
                which is a helper injected by the ``site`` module and is not
                guaranteed to exist in every interpreter setup.
        """
        self.kuri_speak("Ok, Goodbye")
        raise SystemExit

    # ------------------------------------------------------------------
    # Games of chance
    # ------------------------------------------------------------------
    def odds(self):
        """Flips a virtual coin and announces heads or tails."""
        if random.randint(1, 2) == 1:
            self.kuri_speak("It was heads")
        else:
            self.kuri_speak("It was Tails")
        self.kuri_speak("Is there anything else I can help you with?")

    def rollDie(self):
        """Rolls a virtual six-sided die and announces the side it landed on.

        This is the name response() dispatches to; the method previously only
        existed under the misspelled name ``roleDie``.
        """
        side = random.randint(1, 6)
        self.kuri_speak("It landed on " + str(side))
        # Same follow-up prompt every other command ends with.
        self.kuri_speak("Is there anything else I can help you with?")

    def roleDie(self):
        """Backward-compatible alias for rollDie (original, misspelled name)."""
        self.rollDie()

    # ------------------------------------------------------------------
    # Web helpers
    # ------------------------------------------------------------------
    def _get_json(self, url, params=None):
        """Fetches url and returns the decoded JSON body.

        Args:
            url (string): address to request
            params (dict, optional): query-string parameters

        Returns:
            The decoded JSON document.

        Raises:
            requests.RequestException: on connection problems, timeouts or
                HTTP error statuses.
            ValueError: when the body is not valid JSON.
        """
        reply = requests.get(url, params=params, timeout=self._REQUEST_TIMEOUT)
        reply.raise_for_status()
        return json.loads(reply.text)

    def grabWeather(self):
        """
        Summary: Asks the user for a city, geocodes it with Nominatim, queries
        api.weather.gov for that point, and speaks the temperature and short
        forecast of the first forecast period. Every failure (city not heard,
        city not found, weather service error) is spoken instead of raised.
        """
        self.kuri_speak("What city would you like the weather for?")
        cityName = self.getSpeech()
        if cityName is None:
            # getSpeech already explained what went wrong.
            self.kuri_speak("Is there anything else I can help you with?")
            return

        geolocator = Nominatim(user_agent="geoapiExercises")
        location = geolocator.geocode(cityName)
        if location is None:
            # Stop here: there are no coordinates to look up.
            self.kuri_speak("I did not get where you are")
            self.kuri_speak("Is there anything else I can help you with?")
            return

        weather_url = "https://api.weather.gov/points/{0:.4f},{1:.4f}".format(
            location.latitude, location.longitude
        )
        try:
            info = self._get_json(weather_url)
            forecast_data = self._get_json(info["properties"]["forecast"])
            current = forecast_data["properties"]["periods"][0]
            temperature = current["temperature"]
            shortForecast = current["shortForecast"]
        except (requests.RequestException, ValueError, KeyError, IndexError, TypeError):
            # Covers network trouble, HTTP error statuses and replies that
            # lack the expected fields.
            self.kuri_speak("Sorry, I could not get the weather for that location")
        else:
            # NOTE(review): the unit is assumed to be Fahrenheit, as in the
            # original message - confirm against the API's unit field.
            self.kuri_speak(
                "The forecast today is " + str(temperature)
                + " Fahrenheit and weather is " + str(shortForecast)
            )
        self.kuri_speak("Is there anything else I can help you with?")

    # ------------------------------------------------------------------
    # Arithmetic
    # ------------------------------------------------------------------
    @staticmethod
    def _parse_number(text):
        """Returns text as an int (preferred) or float, or None if it is neither."""
        if text is None:
            return None
        for convert in (int, float):
            try:
                return convert(text)
            except ValueError:
                continue
        return None

    def _ask_number(self, prompt):
        """Speaks prompt, listens once, and returns the number heard or None."""
        self.kuri_speak(prompt)
        return self._parse_number(self.getSpeech())

    def _calculate(self, operation):
        """Asks for two numbers and speaks operation(first, second).

        Args:
            operation (callable): two-argument function combining the numbers

        Unusable input and division by zero are reported by voice instead of
        raising; the second number is not requested when the first one could
        not be understood.
        """
        first = self._ask_number("what is your first number?")
        second = None
        if first is not None:
            second = self._ask_number("what is your second number?")

        if first is None or second is None:
            self.kuri_speak("Sorry, I did not hear a number")
        else:
            try:
                result = operation(first, second)
            except ZeroDivisionError:
                self.kuri_speak("Sorry, I cannot divide by zero")
            else:
                self.kuri_speak(str(result))
        self.kuri_speak("Is there anything else I can help you with?")

    def calculateMult(self):
        """Asks for two numbers and speaks their product."""
        self._calculate(lambda first, second: first * second)

    def calculateDiv(self):
        """Asks for two numbers and speaks the first divided by the second."""
        self._calculate(lambda first, second: first / second)

    def calculateAdd(self):
        """Asks for two numbers and speaks their sum."""
        self._calculate(lambda first, second: first + second)

    def calculateSub(self):
        """Asks for two numbers and speaks the first minus the second."""
        self._calculate(lambda first, second: first - second)

    # def calculateTip(self):
    # self.kuri_speak("What is the total amount on your bill?")
    # billAmount = self.getSpeech()
    # self.kuri_speak("How much would you like to tip?")
    # tipPercent = self.getSpeech()
    # self.kuri_speak(str(int(billAmount)*(int(tipPercent)/100)) + " dollars is what you should tip")
    # self.kuri_speak("Is there anything else I can help you with?")

    # ------------------------------------------------------------------
    # Jokes and headlines
    # ------------------------------------------------------------------
    def grab_joke(self, language="en"):
        """
        Summary: Speaks a joke from pyjokes' "neutral" category.

        Args:
            language (str, default): language code passed to pyjokes. Defaults to "en".
        """
        joke = pyjokes.get_joke(language, "neutral")
        self.kuri_speak(str(joke))
        self.kuri_speak("Is there anything else I can help you with?")

    def _news_api_key(self):
        """Returns the NewsAPI key: environment override first, embedded fallback second."""
        return os.environ.get(self._NEWS_API_KEY_ENV, self._FALLBACK_NEWS_API_KEY)

    def _speak_headlines(self, url, params, limit=5):
        """Fetches articles from url and speaks up to ``limit`` titles.

        Args:
            url (string): NewsAPI endpoint
            params (dict): query parameters, including the API key
            limit (int): maximum number of headlines to read

        Fewer than ``limit`` articles, an error payload without "articles",
        or a failed request are all handled by voice rather than raising.
        """
        try:
            payload = self._get_json(url, params)
            titles = [str(entry["title"]) for entry in payload["articles"][:limit]]
        except (requests.RequestException, ValueError, KeyError, TypeError):
            self.kuri_speak("Sorry, I could not get the headlines right now")
        else:
            for title in titles:
                self.kuri_speak(title)
        self.kuri_speak("is there anything else I can help you with?")

    def grabNews(self):
        """
        Summary: Queries NewsAPI for the top bbc-news stories and reads up to
        five of the returned titles to the user.
        """
        query_params = {
            "source": "bbc-news",
            "sortBy": "top",
            "apiKey": self._news_api_key(),
        }
        # NOTE(review): this is the v1 endpoint - confirm it is still served.
        self._speak_headlines("https://newsapi.org/v1/articles", query_params)

    def grabSport(self):
        """
        Summary: Queries NewsAPI's top-headlines endpoint for US sports
        stories and reads up to five of the returned titles to the user.
        """
        query_params = {
            # NOTE(review): "source" is kept as in the original request;
            # verify the v2 endpoint actually uses it.
            "source": "ESPN",
            "country": "us",
            "category": "sports",
            "apiKey": self._news_api_key(),
        }
        self._speak_headlines("https://newsapi.org/v2/top-headlines", query_params)