Update app.py
Browse files
app.py
CHANGED
@@ -1,17 +1,18 @@
|
|
1 |
from flask import Flask, render_template_string, request, jsonify
|
2 |
-
|
3 |
-
import speech_recognition as sr # Import speech recognition
|
4 |
from tempfile import NamedTemporaryFile
|
5 |
-
import ffmpeg
|
6 |
import os
|
|
|
|
|
|
|
7 |
|
|
|
8 |
app = Flask(__name__)
|
9 |
|
10 |
-
#
|
11 |
-
|
12 |
-
user_preferences = {"diet": "all"} # Default to all
|
13 |
|
14 |
-
# HTML
|
15 |
html_code = """
|
16 |
<!DOCTYPE html>
|
17 |
<html lang="en">
|
@@ -75,60 +76,69 @@ html_code = """
|
|
75 |
<body>
|
76 |
<h1>AI Dining Assistant</h1>
|
77 |
<button class="mic-button" id="mic-button">🎤</button>
|
78 |
-
<div class="status" id="status">Press the mic button to start
|
79 |
<div class="response" id="response" style="display: none;">Response will appear here...</div>
|
80 |
<script>
|
81 |
const micButton = document.getElementById('mic-button');
|
82 |
const status = document.getElementById('status');
|
83 |
const response = document.getElementById('response');
|
84 |
-
if (!window.MediaRecorder) {
|
85 |
-
alert("Your browser does not support audio recording.");
|
86 |
-
}
|
87 |
let mediaRecorder;
|
88 |
let audioChunks = [];
|
89 |
-
|
90 |
-
|
91 |
-
|
92 |
-
|
93 |
-
|
94 |
-
|
95 |
-
|
96 |
-
audioChunks = [];
|
97 |
-
mediaRecorder.ondataavailable = event => {
|
98 |
-
audioChunks.push(event.data);
|
99 |
-
};
|
100 |
-
mediaRecorder.onstop = async () => {
|
101 |
-
const audioBlob = new Blob(audioChunks, { type: 'audio/wav; codecs=LINEAR16' });
|
102 |
-
const formData = new FormData();
|
103 |
-
formData.append('audio', audioBlob);
|
104 |
-
status.textContent = 'Processing...';
|
105 |
-
status.classList.remove('listening');
|
106 |
-
try {
|
107 |
-
const result = await fetch('/process-audio', {
|
108 |
-
method: 'POST',
|
109 |
-
body: formData,
|
110 |
-
});
|
111 |
-
const data = await result.json();
|
112 |
-
response.textContent = data.response;
|
113 |
-
response.style.display = 'block';
|
114 |
-
status.textContent = 'Press the mic button to start listening...';
|
115 |
-
// Use browser text-to-speech
|
116 |
-
const utterance = new SpeechSynthesisUtterance(data.response);
|
117 |
-
speechSynthesis.speak(utterance);
|
118 |
-
} catch (error) {
|
119 |
-
response.textContent = 'Error occurred. Please try again.';
|
120 |
-
response.style.display = 'block';
|
121 |
-
status.textContent = 'Press the mic button to start listening...';
|
122 |
-
}
|
123 |
-
};
|
124 |
-
setTimeout(() => {
|
125 |
-
mediaRecorder.stop();
|
126 |
-
}, 5000); // Stop recording after 5 seconds
|
127 |
-
})
|
128 |
-
.catch(err => {
|
129 |
-
status.textContent = 'Microphone access denied.';
|
130 |
-
});
|
131 |
});
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
132 |
</script>
|
133 |
</body>
|
134 |
</html>
|
@@ -141,37 +151,73 @@ def index():
|
|
141 |
@app.route('/process-audio', methods=['POST'])
|
142 |
def process_audio():
|
143 |
try:
|
144 |
-
|
145 |
-
|
146 |
-
|
|
|
|
|
|
|
147 |
audio_file.save(temp_file.name)
|
148 |
-
|
149 |
-
|
|
|
|
|
|
|
|
|
150 |
converted_file = NamedTemporaryFile(delete=False, suffix=".wav")
|
151 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
152 |
|
|
|
153 |
recognizer = sr.Recognizer()
|
154 |
with sr.AudioFile(converted_file.name) as source:
|
155 |
audio_data = recognizer.record(source)
|
156 |
command = recognizer.recognize_google(audio_data)
|
|
|
157 |
response = process_command(command)
|
158 |
|
159 |
-
# Clean up temporary files
|
160 |
-
os.unlink(temp_file.name)
|
161 |
-
os.unlink(converted_file.name)
|
162 |
return jsonify({"response": response})
|
|
|
|
|
|
|
|
|
|
|
163 |
except Exception as e:
|
|
|
164 |
return jsonify({"response": f"An error occurred: {str(e)}"})
|
165 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
166 |
def process_command(command):
|
167 |
"""Process the user's voice command and return a response."""
|
168 |
-
global orders
|
169 |
command = command.lower()
|
170 |
if "menu" in command:
|
171 |
-
return
|
|
|
|
|
|
|
|
|
|
|
172 |
elif "order" in command:
|
173 |
-
return "Your order has been placed."
|
174 |
-
|
|
|
|
|
175 |
|
176 |
if __name__ == "__main__":
|
177 |
app.run(host="0.0.0.0", port=7860)
|
|
|
1 |
from flask import Flask, render_template_string, request, jsonify
|
2 |
+
import speech_recognition as sr
|
|
|
3 |
from tempfile import NamedTemporaryFile
|
|
|
4 |
import os
|
5 |
+
import ffmpeg
|
6 |
+
import logging
|
7 |
+
from werkzeug.exceptions import BadRequest
|
8 |
|
9 |
+
# Initialize Flask App
|
10 |
app = Flask(__name__)
|
11 |
|
12 |
+
# Set up logging
|
13 |
+
logging.basicConfig(level=logging.INFO)
|
|
|
14 |
|
15 |
+
# HTML Template for Frontend
|
16 |
html_code = """
|
17 |
<!DOCTYPE html>
|
18 |
<html lang="en">
|
|
|
76 |
<body>
|
77 |
<h1>AI Dining Assistant</h1>
|
78 |
<button class="mic-button" id="mic-button">🎤</button>
|
79 |
+
<div class="status" id="status">Press the mic button to start the conversation...</div>
|
80 |
<div class="response" id="response" style="display: none;">Response will appear here...</div>
|
81 |
<script>
|
82 |
const micButton = document.getElementById('mic-button');
|
83 |
const status = document.getElementById('status');
|
84 |
const response = document.getElementById('response');
|
|
|
|
|
|
|
85 |
let mediaRecorder;
|
86 |
let audioChunks = [];
|
87 |
+
let isConversationActive = false;
|
88 |
+
|
89 |
+
micButton.addEventListener('click', () => {
|
90 |
+
if (!isConversationActive) {
|
91 |
+
isConversationActive = true;
|
92 |
+
startConversation();
|
93 |
+
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
94 |
});
|
95 |
+
|
96 |
+
function startConversation() {
|
97 |
+
status.textContent = 'Listening...';
|
98 |
+
startListening();
|
99 |
+
}
|
100 |
+
|
101 |
+
function startListening() {
|
102 |
+
navigator.mediaDevices.getUserMedia({ audio: true }).then(stream => {
|
103 |
+
mediaRecorder = new MediaRecorder(stream, { mimeType: 'audio/webm;codecs=opus' });
|
104 |
+
mediaRecorder.start();
|
105 |
+
audioChunks = [];
|
106 |
+
mediaRecorder.ondataavailable = event => audioChunks.push(event.data);
|
107 |
+
mediaRecorder.onstop = async () => {
|
108 |
+
const audioBlob = new Blob(audioChunks, { type: 'audio/webm' });
|
109 |
+
const formData = new FormData();
|
110 |
+
formData.append('audio', audioBlob);
|
111 |
+
|
112 |
+
status.textContent = 'Processing...';
|
113 |
+
try {
|
114 |
+
const result = await fetch('/process-audio', { method: 'POST', body: formData });
|
115 |
+
const data = await result.json();
|
116 |
+
response.textContent = data.response;
|
117 |
+
response.style.display = 'block';
|
118 |
+
|
119 |
+
const utterance = new SpeechSynthesisUtterance(data.response);
|
120 |
+
speechSynthesis.speak(utterance);
|
121 |
+
|
122 |
+
if (data.response.includes("Goodbye")) {
|
123 |
+
status.textContent = 'Conversation ended. Press the mic button to start again.';
|
124 |
+
isConversationActive = false;
|
125 |
+
} else {
|
126 |
+
status.textContent = 'Listening...';
|
127 |
+
setTimeout(startListening, 1000); // Continue listening
|
128 |
+
}
|
129 |
+
} catch (error) {
|
130 |
+
response.textContent = 'Error occurred. Please try again.';
|
131 |
+
response.style.display = 'block';
|
132 |
+
status.textContent = 'Press the mic button to restart the conversation.';
|
133 |
+
isConversationActive = false;
|
134 |
+
}
|
135 |
+
};
|
136 |
+
setTimeout(() => mediaRecorder.stop(), 5000); // Stop recording after 5 seconds
|
137 |
+
}).catch(() => {
|
138 |
+
status.textContent = 'Microphone access denied.';
|
139 |
+
isConversationActive = false;
|
140 |
+
});
|
141 |
+
}
|
142 |
</script>
|
143 |
</body>
|
144 |
</html>
|
|
|
151 |
@app.route('/process-audio', methods=['POST'])
|
152 |
def process_audio():
|
153 |
try:
|
154 |
+
# Validate audio file
|
155 |
+
audio_file = request.files.get('audio')
|
156 |
+
if not audio_file:
|
157 |
+
raise BadRequest("No audio file provided.")
|
158 |
+
|
159 |
+
temp_file = NamedTemporaryFile(delete=False, suffix=".webm")
|
160 |
audio_file.save(temp_file.name)
|
161 |
+
logging.info(f"Saved input audio to {temp_file.name}")
|
162 |
+
|
163 |
+
if os.path.getsize(temp_file.name) == 0:
|
164 |
+
raise BadRequest("Uploaded audio file is empty.")
|
165 |
+
|
166 |
+
# Convert audio to PCM WAV format
|
167 |
converted_file = NamedTemporaryFile(delete=False, suffix=".wav")
|
168 |
+
try:
|
169 |
+
ffmpeg.input(temp_file.name).output(
|
170 |
+
converted_file.name, acodec='pcm_s16le', ac=1, ar='16000'
|
171 |
+
).run(overwrite_output=True)
|
172 |
+
except Exception as ffmpeg_error:
|
173 |
+
logging.error(f"FFmpeg conversion error: {str(ffmpeg_error)}")
|
174 |
+
return jsonify({"response": "Audio conversion failed. Please try again."})
|
175 |
+
|
176 |
+
logging.info(f"Converted audio saved to {converted_file.name}")
|
177 |
|
178 |
+
# Recognize speech
|
179 |
recognizer = sr.Recognizer()
|
180 |
with sr.AudioFile(converted_file.name) as source:
|
181 |
audio_data = recognizer.record(source)
|
182 |
command = recognizer.recognize_google(audio_data)
|
183 |
+
logging.info(f"Recognized command: {command}")
|
184 |
response = process_command(command)
|
185 |
|
|
|
|
|
|
|
186 |
return jsonify({"response": response})
|
187 |
+
|
188 |
+
except BadRequest as br:
|
189 |
+
logging.error(f"Bad request error: {br}")
|
190 |
+
return jsonify({"response": f"Bad Request: {str(br)}"})
|
191 |
+
|
192 |
except Exception as e:
|
193 |
+
logging.error(f"Error processing audio: {e}")
|
194 |
return jsonify({"response": f"An error occurred: {str(e)}"})
|
195 |
|
196 |
+
finally:
|
197 |
+
# Clean up temporary files
|
198 |
+
try:
|
199 |
+
if os.path.exists(temp_file.name):
|
200 |
+
os.unlink(temp_file.name)
|
201 |
+
if os.path.exists(converted_file.name):
|
202 |
+
os.unlink(converted_file.name)
|
203 |
+
except Exception as cleanup_error:
|
204 |
+
logging.error(f"Error cleaning up files: {cleanup_error}")
|
205 |
+
|
206 |
def process_command(command):
|
207 |
"""Process the user's voice command and return a response."""
|
|
|
208 |
command = command.lower()
|
209 |
if "menu" in command:
|
210 |
+
return (
|
211 |
+
"Here is our menu: "
|
212 |
+
"South Indian dishes include Idli, Dosa, Vada, Pongal, Biryani, and Sambar Rice. "
|
213 |
+
"North Indian dishes include Butter Chicken, Paneer Butter Masala, Naan, Dal Makhani, Chole Bhature, and Rajma Chawal. "
|
214 |
+
"What would you like to order?"
|
215 |
+
)
|
216 |
elif "order" in command:
|
217 |
+
return "Your order has been placed. Would you like anything else?"
|
218 |
+
elif "no" in command or "nothing" in command:
|
219 |
+
return "Goodbye! Thank you for using AI Dining Assistant."
|
220 |
+
return "Sorry, I didn't understand your request. Please ask about the menu or place an order."
|
221 |
|
222 |
if __name__ == "__main__":
|
223 |
app.run(host="0.0.0.0", port=7860)
|