Spaces:

reab5555
/

Multimodal-Behavioral-Anomalies-Detection

Running

App Files Files Community

reab5555 committed on Jul 30, 2024

Commit

51a0b51

verified ·

1 Parent(s): bf0f0e7

Update video_processing.py

Browse files

Files changed (1) hide show

video_processing.py +7 -3

video_processing.py CHANGED Viewed

@@ -10,7 +10,7 @@ from face_analysis import get_face_embedding, cluster_faces, organize_faces_by_p
 from pose_analysis import pose, calculate_posture_score, draw_pose_landmarks
 from voice_analysis import get_speaker_embeddings, align_voice_embeddings, extract_audio_from_video, diarize_speakers
 from anomaly_detection import anomaly_detection
-from visualization import plot_mse, plot_mse_histogram, plot_mse_heatmap, plot_stacked_mse_heatmaps
 from utils import frame_to_timecode
 import pandas as pd
 from facenet_pytorch import MTCNN
@@ -197,6 +197,9 @@ def process_video(video_path, anomaly_threshold, desired_fps, progress=None):
             mse_heatmap_posture = plot_mse_heatmap(mse_posture, "Body Posture MSE Heatmap", df)
             mse_heatmap_voice = plot_mse_heatmap(mse_voice, "Voice MSE Heatmap", df)
             stacked_heatmap = plot_stacked_mse_heatmaps(mse_embeddings, mse_posture, mse_voice, df, "Combined MSE Heatmaps")
             progress(0.95, "Finishing generating graphs")
@@ -205,7 +208,7 @@ def process_video(video_path, anomaly_threshold, desired_fps, progress=None):
             print(f"Error details: {str(e)}")
             import traceback
             traceback.print_exc()
-            return (f"Error in video processing: {str(e)}",) + (None,) * 26
         progress(1.0, "Preparing results")
         results = f"Number of persons detected: {num_clusters}\n\n"
@@ -267,12 +270,13 @@ def process_video(video_path, anomaly_threshold, desired_fps, progress=None):
             mse_heatmap_embeddings,
             mse_heatmap_posture,
             mse_heatmap_voice,
             face_samples["most_frequent"],
             anomaly_faces_embeddings,
             anomaly_frames_posture_images,
             aligned_faces_folder,
             frames_folder,
-            stacked_heatmap,
         )

 from pose_analysis import pose, calculate_posture_score, draw_pose_landmarks
 from voice_analysis import get_speaker_embeddings, align_voice_embeddings, extract_audio_from_video, diarize_speakers
 from anomaly_detection import anomaly_detection
+from visualization import plot_mse, plot_mse_histogram, plot_mse_heatmap, plot_audio_waveform, plot_stacked_mse_heatmaps
 from utils import frame_to_timecode
 import pandas as pd
 from facenet_pytorch import MTCNN
             mse_heatmap_posture = plot_mse_heatmap(mse_posture, "Body Posture MSE Heatmap", df)
             mse_heatmap_voice = plot_mse_heatmap(mse_voice, "Voice MSE Heatmap", df)
+            # Create audio waveform plot
+            audio_waveform_plot = plot_audio_waveform(audio_path, "Audio Waveform")
             stacked_heatmap = plot_stacked_mse_heatmaps(mse_embeddings, mse_posture, mse_voice, df, "Combined MSE Heatmaps")
             progress(0.95, "Finishing generating graphs")
             print(f"Error details: {str(e)}")
             import traceback
             traceback.print_exc()
+            return (f"Error in video processing: {str(e)}",) + (None,) * 27
         progress(1.0, "Preparing results")
         results = f"Number of persons detected: {num_clusters}\n\n"
             mse_heatmap_embeddings,
             mse_heatmap_posture,
             mse_heatmap_voice,
+            audio_waveform_plot,
             face_samples["most_frequent"],
             anomaly_faces_embeddings,
             anomaly_frames_posture_images,
             aligned_faces_folder,
             frames_folder,
+            stacked_heatmap
         )