Spaces:

RathodHarish
/

HealthVoiceAnalyzer

Running

App Files Files Community

RathodHarish committed 3 days ago

Commit

a6dea81

verified ·

1 Parent(s): b3db979

Update app.py

Browse files

Files changed (1) hide show

app.py +85 -31

app.py CHANGED Viewed

@@ -1,11 +1,11 @@
 import gradio as gr
 import librosa
 import numpy as np
-import torch
-from transformers import Wav2Vec2Processor, Wav2Vec2Model
-from simple_salesforce import Salesforce
 import os
 from datetime import datetime
 # Salesforce credentials (store securely in environment variables)
 SF_USERNAME = os.getenv("SF_USERNAME", "your_salesforce_username")
@@ -13,6 +13,9 @@ SF_PASSWORD = os.getenv("SF_PASSWORD", "your_salesforce_password")
 SF_SECURITY_TOKEN = os.getenv("SF_SECURITY_TOKEN", "your_salesforce_security_token")
 SF_INSTANCE_URL = os.getenv("SF_INSTANCE_URL", "https://your-salesforce-instance.salesforce.com")
 # Initialize Salesforce connection
 try:
     sf = Salesforce(
@@ -25,54 +28,105 @@ except Exception as e:
     print(f"Failed to connect to Salesforce: {str(e)}")
     sf = None
-# Load Wav2Vec2 model for speech feature extraction
-processor = Wav2Vec2Processor.from_pretrained("facebook/wav2vec2-base-960h")
-model = Wav2Vec2Model.from_pretrained("facebook/wav2vec2-base-960h")
 def analyze_voice(audio_file):
     """Analyze voice for health indicators."""
     try:
-        # Load audio file
-        audio, sr = librosa.load(audio_file, sr=16000)
-        # Process audio for Wav2Vec2
-        inputs = processor(audio, sampling_rate=16000, return_tensors="pt", padding=True)
-        with torch.no_grad():
-            outputs = model(**inputs)
-        # Extract features (simplified for demo)
-        features = outputs.last_hidden_state.mean(dim=1).numpy()
-        # Adjusted thresholds for testing (lower to trigger feedback)
-        respiratory_score = np.mean(features)  # Mock score
-        mental_health_score = np.std(features)  # Mock score
-        feedback = ""
-        if respiratory_score > 0.1:  # Lowered from 0.5
-            feedback += "Possible respiratory issue detected; consult a doctor. "
-        if mental_health_score > 0.1:  # Lowered from 0.3
-            feedback += "Possible stress indicators detected; consider professional advice. "
-        if not feedback:
             feedback = "No significant health indicators detected."
-        feedback += "\n\n**Disclaimer**: This is not a diagnostic tool. Consult a healthcare provider for medical advice."
         # Store in Salesforce
         if sf:
-            store_in_salesforce(audio_file, feedback, respiratory_score, mental_health_score)
         return feedback
     except Exception as e:
         return f"Error processing audio: {str(e)}"
-def store_in_salesforce(audio_file, feedback, respiratory_score, mental_health_score):
     """Store analysis results in Salesforce."""
     try:
         sf.HealthAssessment__c.create({
             "AssessmentDate__c": datetime.utcnow().isoformat(),
             "Feedback__c": feedback,
-            "RespiratoryScore__c": float(respiratory_score),
-            "MentalHealthScore__c": float(mental_health_score),
             "AudioFileName__c": os.path.basename(audio_file)
         })
     except Exception as e:
@@ -80,7 +134,7 @@ def store_in_salesforce(audio_file, feedback, respiratory_score, mental_health_s
 def test_with_sample_audio():
     """Test the app with a sample audio file."""
-    sample_audio_path = "audio_samples/sample.wav"  # Or "audio_samples/common_voice_sample.wav"
     if os.path.exists(sample_audio_path):
         return analyze_voice(sample_audio_path)
     return "Sample audio file not found."
@@ -91,9 +145,9 @@ iface = gr.Interface(
     inputs=gr.Audio(type="filepath", label="Record or Upload Voice"),
     outputs=gr.Textbox(label="Health Assessment Feedback"),
     title="Health Voice Analyzer",
-    description="Record or upload a voice sample for preliminary health assessment. Supports English, Spanish, Hindi, Mandarin."
 )
 if __name__ == "__main__":
-    print(test_with_sample_audio())  # Run test on startup
     iface.launch(server_name="0.0.0.0", server_port=7860)

 import gradio as gr
+import requests
 import librosa
 import numpy as np
 import os
+import hashlib
 from datetime import datetime
+from simple_salesforce import Salesforce
 # Salesforce credentials (store securely in environment variables)
 SF_USERNAME = os.getenv("SF_USERNAME", "your_salesforce_username")
 SF_SECURITY_TOKEN = os.getenv("SF_SECURITY_TOKEN", "your_salesforce_security_token")
 SF_INSTANCE_URL = os.getenv("SF_INSTANCE_URL", "https://your-salesforce-instance.salesforce.com")
+# Hugging Face Inference API token (store in environment variables)
+HF_TOKEN = os.getenv("HF_TOKEN", "your_huggingface_token")
 # Initialize Salesforce connection
 try:
     sf = Salesforce(
     print(f"Failed to connect to Salesforce: {str(e)}")
     sf = None
+# Hugging Face API endpoints
+WHISPER_API_URL = "https://api-inference.huggingface.co/models/openai/whisper-tiny.en"
+SYMPTOM_API_URL = "https://api-inference.huggingface.co/models/abhirajeshbhai/symptom-2-disease-net"
+HEADERS = {"Authorization": f"Bearer {HF_TOKEN}"}
+def compute_file_hash(file_path):
+    """Return the hexadecimal MD5 digest of the file at ``file_path``.
+
+    The file is consumed in 4096-byte pieces, so it is never held in memory
+    as a whole. The digest serves as a fingerprint for telling files apart;
+    MD5 is not collision-resistant, so do not rely on it for security.
+    """
+    digest = hashlib.md5()
+    with open(file_path, "rb") as stream:
+        while True:
+            block = stream.read(4096)
+            if not block:
+                # An empty read marks end of file.
+                break
+            digest.update(block)
+    return digest.hexdigest()
+def transcribe_audio(audio_file, timeout=60):
+    """Transcribe an audio file with the hosted Whisper model.
+
+    Args:
+        audio_file: Path of the audio file; its raw bytes are uploaded as the
+            request body.
+        timeout: Seconds to wait for the Inference API before giving up.
+            ``requests`` does not time out on its own, so without this a
+            stalled connection would block the caller indefinitely.
+
+    Returns:
+        The transcribed text (``""`` when the response carries no ``"text"``
+        field), or a string starting with ``"Error transcribing audio:"``
+        when reading the file or calling the API fails. Failures are reported
+        in-band rather than raised.
+    """
+    try:
+        with open(audio_file, "rb") as f:
+            data = f.read()
+        response = requests.post(
+            WHISPER_API_URL, headers=HEADERS, data=data, timeout=timeout
+        )
+        response.raise_for_status()
+        result = response.json()
+        transcription = result.get("text", "")
+        print(f"Transcription: {transcription}")
+        return transcription
+    except Exception as e:
+        # Deliberately broad: file, HTTP, timeout and response-shape failures
+        # are all turned into the same in-band error string.
+        print(f"Whisper API error: {str(e)}")
+        return f"Error transcribing audio: {str(e)}"
+def analyze_symptoms(text, timeout=60):
+    """Classify a symptom description with the Symptom-2-Disease model.
+
+    Args:
+        text: Free-text symptom description sent as the ``inputs`` payload.
+        timeout: Seconds to wait for the Inference API before giving up.
+            ``requests`` does not time out on its own, so without this a
+            stalled connection would block the caller indefinitely.
+
+    Returns:
+        A ``(prediction, score)`` tuple. ``prediction`` is the first label in
+        the response, ``"No health condition predicted"`` (with score
+        ``0.0``) when the response holds no candidates, or a string starting
+        with ``"Error analyzing symptoms:"`` (with score ``0.0``) when the
+        request fails.
+    """
+    try:
+        payload = {"inputs": text}
+        response = requests.post(
+            SYMPTOM_API_URL, headers=HEADERS, json=payload, timeout=timeout
+        )
+        response.raise_for_status()
+        result = response.json()
+        # The nested shape [[{label, score}, ...]] is the expected one; a flat
+        # [{label, score}, ...] list is accepted too, and an empty candidate
+        # list counts as "nothing predicted" instead of an indexing error.
+        candidates = result
+        if isinstance(result, list) and result and isinstance(result[0], list):
+            candidates = result[0]
+        if isinstance(candidates, list) and candidates:
+            prediction = candidates[0]["label"]
+            score = candidates[0]["score"]
+            print(f"Health Prediction: {prediction}, Score: {score:.4f}")
+            return prediction, score
+        return "No health condition predicted", 0.0
+    except Exception as e:
+        # Deliberately broad: HTTP, timeout and response-shape failures are
+        # all turned into the same in-band error tuple.
+        print(f"Symptom API error: {str(e)}")
+        return f"Error analyzing symptoms: {str(e)}", 0.0
 def analyze_voice(audio_file):
+    """Transcribe a voice recording and turn it into health feedback.
+
+    Steps: fingerprint the file, decode it (which doubles as a format check),
+    transcribe it, classify the transcription, build the feedback text, and
+    store the result in Salesforce when a connection is available.
+
+    Args:
+        audio_file: Path to the recording. A falsy value (presumably what the
+            UI passes when nothing was recorded or uploaded) is rejected.
+
+    Returns:
+        The feedback text, or an in-band error message when any step fails.
+        Exceptions are not propagated to the caller.
+    """
+    if not audio_file:
+        return "Error processing audio: no audio file provided."
     try:
+        # Log audio file info
+        file_hash = compute_file_hash(audio_file)
+        print(f"Processing audio file: {audio_file}, Hash: {file_hash}")
+        # Load audio to verify format
+        audio, sr = librosa.load(audio_file, sr=16000)
+        print(f"Audio shape: {audio.shape}, Sampling rate: {sr}, Duration: {len(audio)/sr:.2f}s, Mean: {np.mean(audio):.4f}, Std: {np.std(audio):.4f}")
+        # Transcribe audio
+        transcription = transcribe_audio(audio_file)
+        # The helpers report failure in-band with a fixed prefix. Matching the
+        # prefix (not any substring) keeps speech that merely contains those
+        # words from being mistaken for a failure.
+        if transcription.startswith("Error transcribing"):
+            return transcription
+        # Analyze symptoms
+        prediction, score = analyze_symptoms(transcription)
+        if prediction.startswith("Error analyzing"):
+            return prediction
+        # Generate feedback
+        if prediction == "No health condition predicted":
             feedback = "No significant health indicators detected."
+        else:
+            feedback = f"Possible health condition: {prediction} (confidence: {score:.4f}). Consult a doctor."
+        feedback += f"\n\n**Debug Info**: Transcription = '{transcription}', Prediction = {prediction}, Confidence = {score:.4f}, File Hash = {file_hash}"
+        feedback += "\n**Disclaimer**: This is not a diagnostic tool. Consult a healthcare provider for medical advice."
         # Store in Salesforce
         if sf:
+            store_in_salesforce(audio_file, feedback, transcription, prediction, score)
         return feedback
     except Exception as e:
         return f"Error processing audio: {str(e)}"
+    finally:
+        # Clean up on every exit path, but only files that are temporary:
+        # the bundled sample recording must survive the startup self-test.
+        _remove_if_temporary(audio_file)
+
+
+def _remove_if_temporary(path):
+    """Delete ``path`` only when it lives under a temporary directory."""
+    import tempfile  # local import so this block does not depend on file-level imports
+
+    temp_roots = [tempfile.gettempdir()]
+    gradio_temp_dir = os.getenv("GRADIO_TEMP_DIR")
+    if gradio_temp_dir:
+        temp_roots.append(gradio_temp_dir)
+    target = os.path.realpath(path)
+    is_temporary = any(
+        target.startswith(os.path.realpath(root) + os.sep) for root in temp_roots
+    )
+    if not is_temporary:
+        return
+    try:
+        os.remove(path)
+        print(f"Deleted temporary audio file: {path}")
+    except OSError as e:
+        # Best effort: a failed cleanup must not change the returned feedback.
+        print(f"Failed to delete audio file: {str(e)}")
+def store_in_salesforce(audio_file, feedback, transcription, prediction, score):
     """Store analysis results in Salesforce."""
     try:
         sf.HealthAssessment__c.create({
             "AssessmentDate__c": datetime.utcnow().isoformat(),
             "Feedback__c": feedback,
+            "Transcription__c": transcription,
+            "Prediction__c": prediction,
+            "Confidence__c": float(score),
             "AudioFileName__c": os.path.basename(audio_file)
         })
     except Exception as e:
 def test_with_sample_audio():
+    """Run the full analysis on the bundled sample recording, if present.
+
+    Returns the analysis feedback, or a fixed notice when the sample file
+    does not exist.
+    """
+    bundled_sample = "audio_samples/sample.wav"
+    if not os.path.exists(bundled_sample):
+        return "Sample audio file not found."
+    return analyze_voice(bundled_sample)
     inputs=gr.Audio(type="filepath", label="Record or Upload Voice"),
     outputs=gr.Textbox(label="Health Assessment Feedback"),
     title="Health Voice Analyzer",
+    description="Record or upload a voice sample describing symptoms for preliminary health assessment. Supports English (transcription), with symptom analysis in English."
 )
 if __name__ == "__main__":
+    print(test_with_sample_audio())
     iface.launch(server_name="0.0.0.0", server_port=7860)