File size: 6,925 Bytes
feaeab3 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 |
'''Copyright 2024 Ashok Kumar
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.'''
import os
import numpy as np
import warnings
import librosa
import streamlit as st
import tempfile
import json
from PIL import Image
import pandas as pd
from joblib import dump, load
import wikipedia
import requests
# import wikipediaapi
from sklearn.preprocessing import LabelEncoder
from tensorflow.keras.models import load_model
# import soundfile as sf
from audio_analysis import audio_signals
from audio_processing import extract_features
import os
from dotenv import load_dotenv
import json
import streamlit as st
from huggingface_hub import InferenceApi, login, InferenceClient
st.set_page_config(
page_title="BirdSense",
page_icon=":bird:",
initial_sidebar_state="expanded",
menu_items={
'Get Help': 'https://ashok2216-myportfolio-github-io.vercel.app/#contact',
'Report a bug': "https://ashok2216-myportfolio-github-io.vercel.app/#contact",
'About': "https://ashok2216-myportfolio-github-io.vercel.app/"
}
)
# Get the Hugging Face token from environment variables
load_dotenv()
hf_token = os.getenv("HF_TOKEN")
if hf_token is None:
raise ValueError("Hugging Face token not found. Please set the HF_TOKEN environment variable.")
# Authenticate with Hugging Face
login(hf_token)
# Model information and links
model_links = {
"Zephyr-7B": "HuggingFaceH4/zephyr-7b-beta"
}
model_info = {
"Zephyr-7B": {
'description': """Zephyr 7B is a Huggingface model, fine-tuned for helpful and instructive interactions.""",
'logo': 'https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha/resolve/main/thumbnail.png'
}
}
# Inference API Initialization
client = InferenceClient('HuggingFaceH4/zephyr-7b-beta')
# Reset conversation button
def reset_conversation():
return [
{"role": "system", "content": "You are a knowledgeable and empathetic ornithologist assistant providing accurate and relevant information based on user input."}
]
# Initialize conversation and chat history
messages = reset_conversation()
# Display chat history
# for message in messages:
# with st.chat_message(message["role"]):
# print(message["content"])
def respond(message, history, max_tokens, temperature, top_p):
# Prepare the list of messages for the chat completion
messages = [{"role": "system", "content": history[0]["content"]}]
for val in history:
if val["role"] == "user":
messages.append({"role": "user", "content": val["content"]})
elif val["role"] == "assistant":
messages.append({"role": "assistant", "content": val["content"]})
messages.append({"role": "user", "content": message})
# Generate response
response = ""
response_container = st.empty() # Placeholder to update the response text dynamically
for message in client.chat_completion(
messages,
max_tokens=max_tokens,
stream=True,
temperature=temperature,
top_p=top_p,
):
token = message.choices[0].delta.content
response += token
# response_container.text(response) # Stream the response
return response
# Load environment variables
load_dotenv()
hf_token = os.getenv("HF_TOKEN")
if hf_token is None:
raise ValueError("Hugging Face token not found. Please set the HF_TOKEN environment variable.")
# Authenticate with Hugging Face
login(hf_token)
image = Image.open('logo.PNG')
st.image(
image, width=250
)
st.subheader('Bird Species Classification')
# st.markdown('Sound of 114 Bird Species :bird: :penguin: :hatched_chick:')
st.header('', divider='rainbow')
@st.cache_data
def loaded_model(model_path):
return load_model(model_path)
@st.cache_data
def predict_class(audio_path, model):
extracted_feature = extract_features(audio_path)
extracted_feature = extracted_feature.reshape(1, 1, extracted_feature.shape[0])
prediction = model.predict(extracted_feature)
predicted_class_index = np.argmax(prediction)
print('HI',predicted_class_index)
# predicted_class_label = label_encoder.inverse_transform([predicted_class_index])[0]
return predicted_class_index
audio_file = st.file_uploader("Upload an Audio file", type=["mp3", "wav", "ogg"], accept_multiple_files=False)
# Load the model
model_path = 'bird_audio_classification_model.h5'
model = loaded_model(model_path)
class_file = open('classes.json', 'r').read()
labels_list = json.loads(class_file)
st.markdown('Download the Sample Audio here :point_down:')
st.page_link("https://dibird.com/", label="DiBird.com", icon="🐦")
st.subheader('Scientific Name of 114 Birds Species :bird:')
with st.container(height=300):
st.markdown(list(labels_list.values()))
# birds = pd.DataFrame(class_file)
# st.table(birds)
st.header('', divider='rainbow')
if audio_file is not None:
with tempfile.NamedTemporaryFile(delete=False) as tmp_file:
tmp_file.write(audio_file.read())
file_path = tmp_file.name
audio_data, sampling_rate = librosa.load(file_path)
st.audio(audio_data, sample_rate=sampling_rate)
st.success("Audio file successfully uploaded and stored temporally.")
audio_signals(file_path)
# Predict the class
y_predict = predict_class(file_path, model)
# Display predicted class
if str(y_predict) in labels_list.keys():
pred = labels_list[str(y_predict)][:-6]
st.subheader(f'Predicted Class: :rainbow[{pred}]')
st.image(wikipedia.page(pred).images[0], caption=labels_list[str(y_predict)][:-6], width=200)
st.markdown(wikipedia.summary(pred))
user_input = f"Explain about {pred} bird"
# Generate and display assistant response
if user_input:
response = respond(user_input, messages, max_tokens = 500, temperature = 0.70, top_p = 0.95)
st.markdown(response)
messages.append({"role": "assistant", "content": response})
st.page_link(wikipedia.page(pred).url, label="Explore more in Wikipedia.com", icon="🌎")
# st.session_state.messages.append({"role": "assistant", "content": response})
else:
st.write('Class not Found')
else:
st.markdown('File not Found!')
|