BirdSense / app.py
ashok2216's picture
Upload 20 files
feaeab3 verified
'''Copyright 2024 Ashok Kumar
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.'''
import os
import numpy as np
import warnings
import librosa
import streamlit as st
import tempfile
import json
from PIL import Image
import pandas as pd
from joblib import dump, load
import wikipedia
import requests
# import wikipediaapi
from sklearn.preprocessing import LabelEncoder
from tensorflow.keras.models import load_model
# import soundfile as sf
from audio_analysis import audio_signals
from audio_processing import extract_features
import os
from dotenv import load_dotenv
import json
import streamlit as st
from huggingface_hub import InferenceApi, login, InferenceClient
# Page-wide Streamlit settings: tab title and icon, initial sidebar state,
# and the links offered in the app menu.
_menu_links = {
    'Get Help': 'https://ashok2216-myportfolio-github-io.vercel.app/#contact',
    'Report a bug': "https://ashok2216-myportfolio-github-io.vercel.app/#contact",
    'About': "https://ashok2216-myportfolio-github-io.vercel.app/",
}
st.set_page_config(
    page_title="BirdSense",
    page_icon=":bird:",
    initial_sidebar_state="expanded",
    menu_items=_menu_links,
)
# Pull HF_TOKEN from the environment (load_dotenv is called first so a local
# .env file can supply it), refuse to continue without it, then log in to
# the Hugging Face Hub with that token.
load_dotenv()
hf_token = os.environ.get("HF_TOKEN")
if hf_token is None:
    raise ValueError(
        "Hugging Face token not found. Please set the HF_TOKEN environment variable."
    )
login(hf_token)
# Chat models known to the app: display name -> Hugging Face Hub repo id.
model_links = {"Zephyr-7B": "HuggingFaceH4/zephyr-7b-beta"}

# Display metadata (short description and logo URL) keyed by display name.
model_info = {
    "Zephyr-7B": {
        'description': """Zephyr 7B is a Huggingface model, fine-tuned for helpful and instructive interactions.""",
        'logo': 'https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha/resolve/main/thumbnail.png',
    },
}

# Inference client bound to the Zephyr repo id listed in `model_links`.
client = InferenceClient(model_links["Zephyr-7B"])
# Conversation seed
def reset_conversation():
    """Return a brand-new chat history holding only the system prompt.

    A fresh list and a fresh message dict are created on every call, so the
    caller may mutate the result without affecting later calls.
    """
    system_turn = dict(
        role="system",
        content="You are a knowledgeable and empathetic ornithologist assistant providing accurate and relevant information based on user input.",
    )
    return [system_turn]
# Module-level chat history, seeded with the system prompt returned by
# reset_conversation(). It is passed to respond() as `history` further down
# in this script, and the assistant reply is appended to it afterwards.
messages = reset_conversation()
# Display chat history (currently disabled)
# for message in messages:
# with st.chat_message(message["role"]):
# print(message["content"])
def _build_chat_messages(message, history):
    """Assemble the chat-completion payload from prior turns plus a new user message."""
    chat = []
    if history:
        # The first history entry supplies the system prompt.
        chat.append({"role": "system", "content": history[0]["content"]})
    # Only user/assistant turns are replayed; any other role is skipped.
    chat.extend(
        {"role": turn["role"], "content": turn["content"]}
        for turn in history
        if turn["role"] in ("user", "assistant")
    )
    chat.append({"role": "user", "content": message})
    return chat


def respond(message, history, max_tokens, temperature, top_p):
    """Ask the chat model a question and return its complete reply.

    Args:
        message: The new user message to send.
        history: Earlier conversation as a list of ``{"role", "content"}``
            dicts. The first entry's content is used as the system prompt;
            an empty history sends no system prompt.
        max_tokens: Upper bound on generated tokens, forwarded to the client.
        temperature: Sampling temperature, forwarded to the client.
        top_p: Nucleus-sampling cutoff, forwarded to the client.

    Returns:
        The reply text, concatenated from the streamed chunks.
    """
    pieces = []
    for chunk in client.chat_completion(
        _build_chat_messages(message, history),
        max_tokens=max_tokens,
        stream=True,
        temperature=temperature,
        top_p=top_p,
    ):
        if not chunk.choices:
            continue
        token = chunk.choices[0].delta.content
        # A streamed delta may carry no text (content is optional), so skip
        # those chunks instead of concatenating None.
        if token:
            pieces.append(token)
    return "".join(pieces)
# The Hugging Face token is loaded and the Hub login performed once near the
# top of this script, so neither is repeated here.

# Page header: logo, section title, and a rainbow divider.
image = Image.open('logo.PNG')
st.image(image, width=250)
st.subheader('Bird Species Classification')
# st.markdown('Sound of 114 Bird Species :bird: :penguin: :hatched_chick:')
st.header('', divider='rainbow')
@st.cache_resource
def loaded_model(model_path):
    """Load the Keras model stored at `model_path`, cached across reruns.

    `st.cache_resource` keeps the single loaded model object in memory and
    returns that same object on later calls; unlike `st.cache_data` it does
    not serialize and copy the return value on every call.

    Args:
        model_path: Path of the saved model file passed to `load_model`.

    Returns:
        The loaded model.
    """
    return load_model(model_path)
# NOTE(review): st.cache_data keys the cache on every argument, so `model`
# is hashed on each call — confirm that is acceptable for the loaded model.
@st.cache_data
def predict_class(audio_path, model):
    """Predict the class index for the audio file at `audio_path`.

    Args:
        audio_path: Path of the audio file handed to `extract_features`.
        model: Object exposing `predict`, called on the reshaped features.

    Returns:
        The index of the highest score in the model output, as a plain int.
    """
    features = extract_features(audio_path)
    # Add two leading axes of length 1 in front of the feature axis.
    model_input = features.reshape(1, 1, features.shape[0])
    scores = model.predict(model_input)
    # predicted_class_label = label_encoder.inverse_transform([predicted_class_index])[0]
    return int(np.argmax(scores))
audio_file = st.file_uploader(
    "Upload an Audio file",
    type=["mp3", "wav", "ogg"],
    accept_multiple_files=False,
)

# Load the model
model_path = 'bird_audio_classification_model.h5'
model = loaded_model(model_path)

# Read the mapping from predicted class index (as a string) to label.
# The context manager closes the file handle as soon as it has been read.
with open('classes.json', 'r', encoding='utf-8') as labels_fh:
    class_file = labels_fh.read()
labels_list = json.loads(class_file)

st.markdown('Download the Sample Audio here :point_down:')
st.page_link("https://dibird.com/", label="DiBird.com", icon="🐦")

# Scrollable box listing every label the model can predict.
st.subheader('Scientific Name of 114 Birds Species :bird:')
with st.container(height=300):
    st.markdown(list(labels_list.values()))
st.header('', divider='rainbow')
def _show_wikipedia_details(species):
    """Render the Wikipedia image and summary for `species`.

    The page is fetched once and reused for the image, summary and URL.

    Returns:
        The page URL, or None when the lookup failed (a warning is shown
        instead of letting the exception abort the page).
    """
    try:
        page = wikipedia.page(species)
        summary = page.summary
        images = page.images
    except (
        wikipedia.exceptions.WikipediaException,
        requests.exceptions.RequestException,
    ) as err:
        st.warning(f"Wikipedia details are unavailable for {species}: {err}")
        return None
    # Some pages have no images; skip the picture rather than index an empty list.
    if images:
        st.image(images[0], caption=species, width=200)
    st.markdown(summary)
    return page.url


if audio_file is not None:
    # The audio helpers below take a file path, so persist the upload first.
    # Leaving the `with` block closes (and flushes) the file before it is read.
    with tempfile.NamedTemporaryFile(delete=False) as tmp_file:
        tmp_file.write(audio_file.read())
        file_path = tmp_file.name
    try:
        audio_data, sampling_rate = librosa.load(file_path)
        st.audio(audio_data, sample_rate=sampling_rate)
        st.success("Audio file successfully uploaded and stored temporally.")
        audio_signals(file_path)
        # Predict the class
        y_predict = predict_class(file_path, model)
    finally:
        # delete=False leaves the file on disk, so remove it explicitly.
        # Cleanup is best-effort: a failed delete must not hide the result.
        try:
            os.remove(file_path)
        except OSError:
            pass

    # Display predicted class
    label = labels_list.get(str(y_predict))
    if label is not None:
        # Drop the last six characters of the stored label
        # (presumably a fixed-length suffix in classes.json — TODO confirm).
        pred = label[:-6]
        st.subheader(f'Predicted Class: :rainbow[{pred}]')
        wiki_url = _show_wikipedia_details(pred)
        user_input = f"Explain about {pred} bird"
        # Generate and display assistant response
        response = respond(user_input, messages, max_tokens=500, temperature=0.70, top_p=0.95)
        st.markdown(response)
        # Record both sides of the exchange so the history stays well-formed.
        messages.append({"role": "user", "content": user_input})
        messages.append({"role": "assistant", "content": response})
        if wiki_url is not None:
            st.page_link(wiki_url, label="Explore more in Wikipedia.com", icon="🌎")
    else:
        st.write('Class not Found')
else:
    st.markdown('File not Found!')