Add application file
- .gitignore +3 -0
- README.md +186 -4
- app.py +1396 -0
- requirements.txt +2 -0
- webui.bat +73 -0
.gitignore
ADDED
@@ -0,0 +1,3 @@
+.vs
+venv
+tmp
README.md
CHANGED
@@ -1,14 +1,196 @@
---
-title:
+title: ImgutilsVideoProcessor
-emoji:
+emoji: 🖼️
colorFrom: indigo
-colorTo:
+colorTo: pink
sdk: gradio
sdk_version: 5.29.0
app_file: app.py
-pinned:
+pinned: true
license: mit
short_description: 'Video Processor: Detection, Classification, Analysis'
---

Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

---

# [deepghs/anime_person_detection](https://huggingface.co/deepghs/anime_person_detection)

| Model | FLOPS | Params | F1 Score | Threshold | F1 Plot | Confusion | Labels |
|:--------------------:|:-------:|:--------:|:----------:|:-----------:|:---------------------------------------------------------------------------------------------------------:|:----------------------------------------------------------------------------------------------------------------------:|:--------:|
| person_detect_v1.2_s | 3.49k | 11.1M | 0.86 | 0.295 | [plot](https://huggingface.co/deepghs/anime_person_detection/blob/main/person_detect_v1.2_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_person_detection/blob/main/person_detect_v1.2_s/confusion_matrix.png) | `person` |
| person_detect_v1.3_s | 3.49k | 11.1M | 0.86 | 0.324 | [plot](https://huggingface.co/deepghs/anime_person_detection/blob/main/person_detect_v1.3_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_person_detection/blob/main/person_detect_v1.3_s/confusion_matrix.png) | `person` |
| person_detect_v0_x | 31.3k | 68.1M | N/A | N/A | N/A | N/A | `person` |
| person_detect_v0_m | 9.53k | 25.8M | 0.85 | 0.424 | [plot](https://huggingface.co/deepghs/anime_person_detection/blob/main/person_detect_v0_m/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_person_detection/blob/main/person_detect_v0_m/confusion_matrix.png) | `person` |
| person_detect_v0_s | 3.49k | 11.1M | N/A | N/A | N/A | N/A | `person` |
| person_detect_v1.1_s | 3.49k | 11.1M | 0.86 | 0.384 | [plot](https://huggingface.co/deepghs/anime_person_detection/blob/main/person_detect_v1.1_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_person_detection/blob/main/person_detect_v1.1_s/confusion_matrix.png) | `person` |
| person_detect_v1.1_n | 898 | 3.01M | 0.85 | 0.327 | [plot](https://huggingface.co/deepghs/anime_person_detection/blob/main/person_detect_v1.1_n/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_person_detection/blob/main/person_detect_v1.1_n/confusion_matrix.png) | `person` |
| person_detect_v1.1_m | 9.53k | 25.8M | 0.87 | 0.348 | [plot](https://huggingface.co/deepghs/anime_person_detection/blob/main/person_detect_v1.1_m/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_person_detection/blob/main/person_detect_v1.1_m/confusion_matrix.png) | `person` |
| person_detect_v1_m | 9.53k | 25.8M | 0.86 | 0.351 | [plot](https://huggingface.co/deepghs/anime_person_detection/blob/main/person_detect_v1_m/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_person_detection/blob/main/person_detect_v1_m/confusion_matrix.png) | `person` |
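
The snippet below is a usage sketch added for orientation, not part of this commit: it shows how a model from the table above might be invoked through the `imgutils.detect.person` module that `app.py` imports. The `conf_threshold` keyword and the `((x0, y0, x1, y1), label, score)` result layout are assumptions based on the dghs-imgutils documentation; 0.295 is the F1-optimal threshold listed for `person_detect_v1.2_s`.

```python
# Usage sketch (assumed dghs-imgutils API surface, not part of app.py).
from PIL import Image
import imgutils.detect.person as person_detector  # same import style as app.py

frame = Image.open('frame_0001.png')
# 0.295 = F1-optimal confidence threshold reported for person_detect_v1.2_s above.
detections = person_detector.detect_person(frame, conf_threshold=0.295)
for (x0, y0, x1, y1), label, score in detections:
    print(f"{label} {score:.3f} box=({x0}, {y0}, {x1}, {y1})")
```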

___

# [deepghs/anime_halfbody_detection](https://huggingface.co/deepghs/anime_halfbody_detection)
| Model | FLOPS | Params | F1 Score | Threshold | F1 Plot | Confusion | Labels |
|:----------------------:|:-------:|:--------:|:----------:|:-----------:|:-------------------------------------------------------------------------------------------------------------:|:--------------------------------------------------------------------------------------------------------------------------:|:----------:|
| halfbody_detect_v1.0_n | 898 | 3.01M | 0.94 | 0.512 | [plot](https://huggingface.co/deepghs/anime_halfbody_detection/blob/main/halfbody_detect_v1.0_n/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_halfbody_detection/blob/main/halfbody_detect_v1.0_n/confusion_matrix.png) | `halfbody` |
| halfbody_detect_v1.0_s | 3.49k | 11.1M | 0.95 | 0.577 | [plot](https://huggingface.co/deepghs/anime_halfbody_detection/blob/main/halfbody_detect_v1.0_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_halfbody_detection/blob/main/halfbody_detect_v1.0_s/confusion_matrix.png) | `halfbody` |
| halfbody_detect_v0.4_s | 3.49k | 11.1M | 0.93 | 0.517 | [plot](https://huggingface.co/deepghs/anime_halfbody_detection/blob/main/halfbody_detect_v0.4_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_halfbody_detection/blob/main/halfbody_detect_v0.4_s/confusion_matrix.png) | `halfbody` |
| halfbody_detect_v0.3_s | 3.49k | 11.1M | 0.92 | 0.222 | [plot](https://huggingface.co/deepghs/anime_halfbody_detection/blob/main/halfbody_detect_v0.3_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_halfbody_detection/blob/main/halfbody_detect_v0.3_s/confusion_matrix.png) | `halfbody` |
| halfbody_detect_v0.2_s | 3.49k | 11.1M | 0.94 | 0.548 | [plot](https://huggingface.co/deepghs/anime_halfbody_detection/blob/main/halfbody_detect_v0.2_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_halfbody_detection/blob/main/halfbody_detect_v0.2_s/confusion_matrix.png) | `halfbody` |

___

# [deepghs/anime_head_detection](https://huggingface.co/deepghs/anime_head_detection)
| Model | Type | FLOPS | Params | F1 Score | Threshold | precision(B) | recall(B) | mAP50(B) | mAP50-95(B) | F1 Plot | Confusion | Labels |
|:-------------------------:|:------:|:-------:|:--------:|:----------:|:-----------:|:--------------:|:-----------:|:----------:|:-------------:|:------------------------------------------------------------------------------------------------------------:|:------------------------------------------------------------------------------------------------------------------------------------:|:--------:|
| head_detect_v2.0_x_yv11 | yolo | 195G | 56.9M | 0.93 | 0.458 | 0.95942 | 0.90938 | 0.96853 | 0.78938 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_x_yv11/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_x_yv11/confusion_matrix_normalized.png) | `head` |
| head_detect_v2.0_l_yv11 | yolo | 87.3G | 25.3M | 0.93 | 0.432 | 0.95557 | 0.90905 | 0.9661 | 0.78709 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_l_yv11/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_l_yv11/confusion_matrix_normalized.png) | `head` |
| head_detect_v2.0_m_yv11 | yolo | 68.2G | 20.1M | 0.93 | 0.42 | 0.95383 | 0.90658 | 0.96485 | 0.78511 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_m_yv11/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_m_yv11/confusion_matrix_normalized.png) | `head` |
| head_detect_v2.0_s_yv11 | yolo | 21.5G | 9.43M | 0.92 | 0.383 | 0.954 | 0.89512 | 0.95789 | 0.77753 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_s_yv11/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_s_yv11/confusion_matrix_normalized.png) | `head` |
| head_detect_v2.0_n_yv11 | yolo | 6.44G | 2.59M | 0.91 | 0.365 | 0.94815 | 0.87169 | 0.9452 | 0.75835 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_n_yv11/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_n_yv11/confusion_matrix_normalized.png) | `head` |
| head_detect_v2.0_x | yolo | 227G | 61.6M | 0.93 | 0.459 | 0.95378 | 0.91123 | 0.96593 | 0.78767 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_x/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_x/confusion_matrix_normalized.png) | `head` |
| head_detect_v2.0_l | yolo | 146G | 39.5M | 0.93 | 0.379 | 0.95124 | 0.91264 | 0.96458 | 0.78627 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_l/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_l/confusion_matrix_normalized.png) | `head` |
| head_detect_v2.0_m | yolo | 79.1G | 25.9M | 0.93 | 0.397 | 0.95123 | 0.90701 | 0.96403 | 0.78342 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_m/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_m/confusion_matrix_normalized.png) | `head` |
| head_detect_v2.0_s | yolo | 28.6G | 11.1M | 0.92 | 0.413 | 0.95556 | 0.89197 | 0.95799 | 0.77833 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_s/confusion_matrix_normalized.png) | `head` |
| head_detect_v2.0_n | yolo | 8.19G | 3.01M | 0.91 | 0.368 | 0.94633 | 0.87046 | 0.94361 | 0.75764 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_n/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v2.0_n/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.6_x_rtdetr | rtdetr | 232G | 67.3M | 0.93 | 0.559 | 0.95316 | 0.91697 | 0.96556 | 0.76682 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_x_rtdetr/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_x_rtdetr/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.6_l_rtdetr | rtdetr | 108G | 32.8M | 0.93 | 0.53 | 0.95113 | 0.90956 | 0.96218 | 0.76201 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_l_rtdetr/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_l_rtdetr/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.6_s_yv11 | yolo | 21.5G | 9.43M | 0.93 | 0.42 | 0.95273 | 0.90558 | 0.96327 | 0.78566 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_s_yv11/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_s_yv11/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.6_n_yv11 | yolo | 6.44G | 2.59M | 0.92 | 0.385 | 0.95561 | 0.87798 | 0.95086 | 0.76765 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_n_yv11/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_n_yv11/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.6_s_yv9 | yolo | 22.7G | 6.32M | 0.93 | 0.419 | 0.95464 | 0.90425 | 0.9627 | 0.78663 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_s_yv9/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_s_yv9/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.6_t_yv9 | yolo | 6.7G | 1.77M | 0.91 | 0.332 | 0.94968 | 0.8792 | 0.95069 | 0.76789 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_t_yv9/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_t_yv9/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.6_x | yolo | 258G | 68.2M | 0.94 | 0.448 | 0.9546 | 0.91873 | 0.96878 | 0.79502 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_x/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_x/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.6_l | yolo | 165G | 43.6M | 0.94 | 0.458 | 0.95733 | 0.92018 | 0.96868 | 0.79428 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_l/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_l/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.6_s_yv10 | yolo | 24.8G | 8.07M | 0.93 | 0.406 | 0.95424 | 0.90074 | 0.96201 | 0.78713 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_s_yv10/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_s_yv10/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.6_n_yv10 | yolo | 8.39G | 2.71M | 0.91 | 0.374 | 0.94845 | 0.87492 | 0.9503 | 0.77059 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_n_yv10/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_n_yv10/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.6_s | yolo | 28.6G | 11.1M | 0.93 | 0.381 | 0.95333 | 0.90587 | 0.96241 | 0.78688 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_s/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.6_n | yolo | 8.19G | 3.01M | 0.92 | 0.38 | 0.94835 | 0.88436 | 0.95051 | 0.76766 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_n/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.6_n/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.5_s | yolo | 28.6G | 11.1M | 0.94 | 0.453 | 0.96014 | 0.92275 | 0.96829 | 0.80674 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.5_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.5_s/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.5_n | yolo | 8.19G | 3.01M | 0.93 | 0.396 | 0.95719 | 0.90511 | 0.9612 | 0.78841 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.5_n/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.5_n/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.4_s | yolo | 28.6G | 11.1M | 0.94 | 0.472 | 0.96275 | 0.91875 | 0.96812 | 0.80417 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.4_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.4_s/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.4_n | yolo | 8.19G | 3.01M | 0.93 | 0.396 | 0.9557 | 0.90559 | 0.96075 | 0.78689 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.4_n/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.4_n/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.3_s | yolo | 28.6G | 11.1M | 0.94 | 0.423 | 0.95734 | 0.9257 | 0.97037 | 0.80391 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.3_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.3_s/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.3_n | yolo | 8.19G | 3.01M | 0.93 | 0.409 | 0.95254 | 0.90674 | 0.96258 | 0.7844 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.3_n/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.3_n/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.2_s | yolo | 28.6G | 11.1M | 0.94 | 0.415 | 0.95756 | 0.9271 | 0.97097 | 0.80514 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.2_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.2_s/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.2_n | yolo | 8.19G | 3.01M | 0.93 | 0.471 | 0.96309 | 0.89766 | 0.9647 | 0.78928 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.2_n/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.2_n/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.1_s | yolo | 28.6G | 11.1M | 0.94 | 0.485 | 0.96191 | 0.91892 | 0.97069 | 0.80182 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.1_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.1_s/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.0_l | yolo | 165G | 43.6M | 0.94 | 0.579 | 0.95881 | 0.91532 | 0.96561 | 0.81417 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.0_l/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.0_l/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.0_x | yolo | 258G | 68.2M | 0.94 | 0.567 | 0.9597 | 0.91947 | 0.96682 | 0.8154 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.0_x/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.0_x/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.0_m | yolo | 79.1G | 25.9M | 0.94 | 0.489 | 0.95805 | 0.9196 | 0.96632 | 0.81383 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.0_m/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.0_m/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.0_s | yolo | 28.6G | 11.1M | 0.93 | 0.492 | 0.95267 | 0.91355 | 0.96245 | 0.80371 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.0_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.0_s/confusion_matrix_normalized.png) | `head` |
| head_detect_v1.0_n | yolo | 8.19G | 3.01M | 0.92 | 0.375 | 0.93999 | 0.9002 | 0.95509 | 0.7849 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.0_n/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v1.0_n/confusion_matrix_normalized.png) | `head` |
| head_detect_v0.5_s | yolo | 28.6G | 11.1M | 0.92 | 0.415 | 0.93908 | 0.9034 | 0.95697 | 0.77514 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.5_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.5_s/confusion_matrix_normalized.png) | `head` |
| head_detect_v0.5_n | yolo | 8.19G | 3.01M | 0.91 | 0.446 | 0.93834 | 0.88034 | 0.94784 | 0.75251 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.5_n/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.5_n/confusion_matrix_normalized.png) | `head` |
| head_detect_v0.5_s_pruned | yolo | 28.6G | 11.1M | 0.93 | 0.472 | 0.95455 | 0.89865 | 0.9584 | 0.79968 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.5_s_pruned/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.5_s_pruned/confusion_matrix_normalized.png) | `head` |
| head_detect_v0.5_n_pruned | yolo | 8.19G | 3.01M | 0.91 | 0.523 | 0.95254 | 0.8743 | 0.95049 | 0.7807 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.5_n_pruned/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.5_n_pruned/confusion_matrix_normalized.png) | `head` |
| head_detect_v0.5_m_pruned | yolo | 79.1G | 25.9M | 0.94 | 0.52 | 0.9609 | 0.91365 | 0.96501 | 0.81322 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.5_m_pruned/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.5_m_pruned/confusion_matrix_normalized.png) | `head` |
| head_detect_v0.4_s | yolo | 28.6G | 11.1M | 0.92 | 0.405 | 0.93314 | 0.90274 | 0.95727 | 0.77193 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.4_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.4_s/confusion_matrix_normalized.png) | `head` |
| head_detect_v0.4_s_fp | yolo | 28.6G | 11.1M | 0.91 | 0.445 | 0.93181 | 0.89113 | 0.95002 | 0.76302 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.4_s_fp/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.4_s_fp/confusion_matrix_normalized.png) | `head` |
| head_detect_v0.3_s | yolo | 28.6G | 11.1M | 0.91 | 0.406 | 0.92457 | 0.90351 | 0.95785 | 0.78912 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.3_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.3_s/confusion_matrix_normalized.png) | `head` |
| head_detect_v0.2_s_plus | yolo | 28.6G | 11.1M | 0.91 | 0.594 | 0.94239 | 0.8774 | 0.94909 | 0.77986 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.2_s_plus/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.2_s_plus/confusion_matrix_normalized.png) | `head` |
| head_detect_v0.2_s | yolo | 28.6G | 11.1M | 0.9 | 0.461 | 0.91861 | 0.8898 | 0.94765 | 0.77541 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.2_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.2_s/confusion_matrix_normalized.png) | `head` |
| head_detect_v0.1_s | yolo | 28.6G | 11.1M | 0.9 | 0.504 | 0.91576 | 0.88662 | 0.94213 | 0.7713 | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.1_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0.1_s/confusion_matrix_normalized.png) | `head` |
| head_detect_v0_n | yolo | 8.19G | 3.01M | 0.9 | 0.316 | N/A | N/A | N/A | N/A | [plot](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0_n/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_head_detection/blob/main/head_detect_v0_n/confusion_matrix.png) | `head` |
| head_detect_v0_s | yolo | 28.6G | 11.1M | N/A | N/A | N/A | N/A | N/A | N/A | N/A | N/A | `head` |

___

# [deepghs/ccip](https://huggingface.co/deepghs/ccip)
| Model | F1 Score | Precision | Recall | Threshold | Cluster_2 | Cluster_Free |
|:-----------------------------------:|:----------:|:-----------:|:--------:|:-----------:|:-----------:|:--------------:|
| ccip-caformer_b36-24 | 0.940925 | 0.938254 | 0.943612 | 0.213231 | 0.89508 | 0.957017 |
| ccip-caformer-24-randaug-pruned | 0.917211 | 0.933481 | 0.901499 | 0.178475 | 0.890366 | 0.922375 |
| ccip-v2-caformer_s36-10 | 0.906422 | 0.932779 | 0.881513 | 0.207757 | 0.874592 | 0.89241 |
| ccip-caformer-6-randaug-pruned_fp32 | 0.878403 | 0.893648 | 0.863669 | 0.195122 | 0.810176 | 0.897904 |
| ccip-caformer-5_fp32 | 0.864363 | 0.90155 | 0.830121 | 0.183973 | 0.792051 | 0.862289 |
| ccip-caformer-4_fp32 | 0.844967 | 0.870553 | 0.820842 | 0.18367 | 0.795565 | 0.868133 |
| ccip-caformer_query-12 | 0.823928 | 0.871122 | 0.781585 | 0.141308 | 0.787237 | 0.809426 |
| ccip-caformer-23_randaug_fp32 | 0.81625 | 0.854134 | 0.781585 | 0.136797 | 0.745697 | 0.8068 |
| ccip-caformer-2-randaug-pruned_fp32 | 0.78561 | 0.800148 | 0.771592 | 0.171053 | 0.686617 | 0.728195 |
| ccip-caformer-2_fp32 | 0.755125 | 0.790172 | 0.723055 | 0.141275 | 0.64977 | 0.718516 |
* The calculation of `F1 Score`, `Precision`, and `Recall` considers "the characters in both images are the same" as a positive case. `Threshold` is determined by finding the maximum value on the F1 Score curve.
* `Cluster_2` represents the approximate optimal clustering solution obtained by tuning the eps value in the DBSCAN clustering algorithm with min_samples set to `2`, and evaluating the similarity between the obtained clusters and the true distribution using the `random_adjust_score`.
* `Cluster_Free` represents the approximate optimal solution obtained by tuning the `max_eps` and `min_samples` values in the OPTICS clustering algorithm, and evaluating the similarity between the obtained clusters and the true distribution using the `random_adjust_score`.
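
To make the `Cluster_2` description above concrete, here is a hedged sketch of that style of evaluation: DBSCAN with `min_samples=2` over pairwise CCIP differences, scored against the true character assignment with scikit-learn's adjusted Rand score (presumably what `random_adjust_score` refers to). The `ccip_extract_feature` and `ccip_batch_differences` names are assumptions about the `imgutils.metrics.ccip` API that `app.py` imports.

```python
# Hypothetical reproduction of the Cluster_2 metric described above.
import numpy as np
from sklearn.cluster import DBSCAN
from sklearn.metrics import adjusted_rand_score
from imgutils.metrics import ccip_extract_feature, ccip_batch_differences  # assumed names

def cluster_2_score(image_paths, true_character_ids):
    feats = [ccip_extract_feature(p) for p in image_paths]
    dist = ccip_batch_differences(feats)  # pairwise CCIP difference matrix
    best = -1.0
    for eps in np.linspace(0.05, 0.40, 36):  # sweep eps, keep the best agreement
        labels = DBSCAN(eps=eps, min_samples=2, metric='precomputed').fit_predict(dist)
        best = max(best, adjusted_rand_score(true_character_ids, labels))
    return best
```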

___

# [deepghs/anime_aesthetic](https://huggingface.co/spaces/deepghs/anime_aesthetic)
| Name | FLOPS | Params | Accuracy | AUC | Confusion | Labels |
|:------------------------:|:-------:|:--------:|:----------:|:------:|:-----------------------------------------------------------------------------------------------------------------:|:----------------------------------------------------------------:|
| caformer_s36_v0_ls0.2 | 22.10G | 37.22M | 34.68% | 0.7725 | [confusion](https://huggingface.co/deepghs/anime_aesthetic/blob/main/caformer_s36_v0_ls0.2/plot_confusion.png) | `masterpiece`, `best`, `great`, `good`, `normal`, `low`, `worst` |
| swinv2pv3_v0_448_ls0.2 | 46.20G | 65.94M | 40.32% | 0.8188 | [confusion](https://huggingface.co/deepghs/anime_aesthetic/blob/main/swinv2pv3_v0_448_ls0.2/plot_confusion.png) | `masterpiece`, `best`, `great`, `good`, `normal`, `low`, `worst` |
| swinv2pv3_v0_448_ls0.2_x | 46.20G | 65.94M | 40.88% | 0.8214 | [confusion](https://huggingface.co/deepghs/anime_aesthetic/blob/main/swinv2pv3_v0_448_ls0.2_x/plot_confusion.png) | `masterpiece`, `best`, `great`, `good`, `normal`, `low`, `worst` |
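
A very rough usage sketch for these aesthetic models follows; the `anime_dbaesthetic` function name and the shape of its result are assumptions inferred from the `imgutils.metrics.dbaesthetic` module imported by `app.py`, so consult the dghs-imgutils documentation before relying on this.

```python
# Hypothetical call; the function name and result shape are assumptions, not confirmed API.
from PIL import Image
import imgutils.metrics.dbaesthetic as dbaesthetic_analyzer  # same import as app.py

image = Image.open('sample.png')
result = dbaesthetic_analyzer.anime_dbaesthetic(image)
print(result)  # expected to reflect one of the labels above (masterpiece ... worst)
```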

___

# [deepghs/anime_face_detection](https://huggingface.co/deepghs/anime_face_detection)
| Model | FLOPS | Params | F1 Score | Threshold | F1 Plot | Confusion | Labels |
|:------------------:|:-------:|:--------:|:----------:|:-----------:|:-----------------------------------------------------------------------------------------------------:|:------------------------------------------------------------------------------------------------------------------:|:--------:|
| face_detect_v1.4_n | 898 | 3.01M | 0.94 | 0.278 | [plot](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v1.4_n/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v1.4_n/confusion_matrix.png) | `face` |
| face_detect_v1.4_s | 3.49k | 11.1M | 0.95 | 0.307 | [plot](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v1.4_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v1.4_s/confusion_matrix.png) | `face` |
| face_detect_v1.3_n | 898 | 3.01M | 0.93 | 0.305 | [plot](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v1.3_n/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v1.3_n/confusion_matrix.png) | `face` |
| face_detect_v1.2_s | 3.49k | 11.1M | 0.93 | 0.222 | [plot](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v1.2_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v1.2_s/confusion_matrix.png) | `face` |
| face_detect_v1.3_s | 3.49k | 11.1M | 0.93 | 0.259 | [plot](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v1.3_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v1.3_s/confusion_matrix.png) | `face` |
| face_detect_v1_s | 3.49k | 11.1M | 0.95 | 0.446 | [plot](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v1_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v1_s/confusion_matrix.png) | `face` |
| face_detect_v1_n | 898 | 3.01M | 0.95 | 0.458 | [plot](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v1_n/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v1_n/confusion_matrix.png) | `face` |
| face_detect_v0_n | 898 | 3.01M | 0.97 | 0.428 | [plot](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v0_n/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v0_n/confusion_matrix.png) | `face` |
| face_detect_v0_s | 3.49k | 11.1M | N/A | N/A | N/A | N/A | `face` |
| face_detect_v1.1_n | 898 | 3.01M | 0.94 | 0.373 | [plot](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v1.1_n/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v1.1_n/confusion_matrix.png) | `face` |
| face_detect_v1.1_s | 3.49k | 11.1M | 0.94 | 0.405 | [plot](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v1.1_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/anime_face_detection/blob/main/face_detect_v1.1_s/confusion_matrix.png) | `face` |
___

# [deepghs/real_person_detection](https://huggingface.co/deepghs/real_person_detection)
| Model | Type | FLOPS | Params | F1 Score | Threshold | precision(B) | recall(B) | mAP50(B) | mAP50-95(B) | F1 Plot | Confusion | Labels |
|:-----------------------:|:------:|:-------:|:--------:|:----------:|:-----------:|:--------------:|:-----------:|:----------:|:-------------:|:-----------------------------------------------------------------------------------------------------------:|:-----------------------------------------------------------------------------------------------------------------------------------:|:--------:|
| person_detect_v0_l_yv11 | yolo | 87.3G | 25.3M | 0.79 | 0.359 | 0.84037 | 0.74055 | 0.82796 | 0.57272 | [plot](https://huggingface.co/deepghs/real_person_detection/blob/main/person_detect_v0_l_yv11/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_person_detection/blob/main/person_detect_v0_l_yv11/confusion_matrix_normalized.png) | `person` |
| person_detect_v0_m_yv11 | yolo | 68.2G | 20.1M | 0.78 | 0.351 | 0.83393 | 0.73614 | 0.82195 | 0.56267 | [plot](https://huggingface.co/deepghs/real_person_detection/blob/main/person_detect_v0_m_yv11/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_person_detection/blob/main/person_detect_v0_m_yv11/confusion_matrix_normalized.png) | `person` |
| person_detect_v0_s_yv11 | yolo | 21.5G | 9.43M | 0.75 | 0.344 | 0.82356 | 0.6967 | 0.79224 | 0.52304 | [plot](https://huggingface.co/deepghs/real_person_detection/blob/main/person_detect_v0_s_yv11/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_person_detection/blob/main/person_detect_v0_s_yv11/confusion_matrix_normalized.png) | `person` |
| person_detect_v0_n_yv11 | yolo | 6.44G | 2.59M | 0.71 | 0.325 | 0.80096 | 0.64148 | 0.74612 | 0.46875 | [plot](https://huggingface.co/deepghs/real_person_detection/blob/main/person_detect_v0_n_yv11/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_person_detection/blob/main/person_detect_v0_n_yv11/confusion_matrix_normalized.png) | `person` |
| person_detect_v0_l | yolo | 165G | 43.6M | 0.79 | 0.359 | 0.83674 | 0.74182 | 0.82536 | 0.57022 | [plot](https://huggingface.co/deepghs/real_person_detection/blob/main/person_detect_v0_l/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_person_detection/blob/main/person_detect_v0_l/confusion_matrix_normalized.png) | `person` |
| person_detect_v0_m | yolo | 79.1G | 25.9M | 0.78 | 0.363 | 0.83439 | 0.72529 | 0.81314 | 0.55388 | [plot](https://huggingface.co/deepghs/real_person_detection/blob/main/person_detect_v0_m/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_person_detection/blob/main/person_detect_v0_m/confusion_matrix_normalized.png) | `person` |
| person_detect_v0_s | yolo | 28.6G | 11.1M | 0.76 | 0.346 | 0.82522 | 0.69696 | 0.79105 | 0.52201 | [plot](https://huggingface.co/deepghs/real_person_detection/blob/main/person_detect_v0_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_person_detection/blob/main/person_detect_v0_s/confusion_matrix_normalized.png) | `person` |
| person_detect_v0_n | yolo | 8.19G | 3.01M | 0.72 | 0.32 | 0.80883 | 0.64552 | 0.74996 | 0.47272 | [plot](https://huggingface.co/deepghs/real_person_detection/blob/main/person_detect_v0_n/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_person_detection/blob/main/person_detect_v0_n/confusion_matrix_normalized.png) | `person` |

___

# [deepghs/real_head_detection](https://huggingface.co/deepghs/real_head_detection)
| Model | Type | FLOPS | Params | F1 Score | Threshold | precision(B) | recall(B) | mAP50(B) | mAP50-95(B) | F1 Plot | Confusion | Labels |
|:---------------------:|:------:|:-------:|:--------:|:----------:|:-----------:|:--------------:|:-----------:|:----------:|:-------------:|:-------------------------------------------------------------------------------------------------------:|:-------------------------------------------------------------------------------------------------------------------------------:|:--------:|
| head_detect_v0_l_yv11 | yolo | 87.3G | 25.3M | 0.81 | 0.199 | 0.90226 | 0.72872 | 0.81049 | 0.5109 | [plot](https://huggingface.co/deepghs/real_head_detection/blob/main/head_detect_v0_l_yv11/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_head_detection/blob/main/head_detect_v0_l_yv11/confusion_matrix_normalized.png) | `head` |
| head_detect_v0_m_yv11 | yolo | 68.2G | 20.1M | 0.8 | 0.206 | 0.89855 | 0.72654 | 0.80704 | 0.50804 | [plot](https://huggingface.co/deepghs/real_head_detection/blob/main/head_detect_v0_m_yv11/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_head_detection/blob/main/head_detect_v0_m_yv11/confusion_matrix_normalized.png) | `head` |
| head_detect_v0_s_yv11 | yolo | 21.5G | 9.43M | 0.78 | 0.187 | 0.88726 | 0.69234 | 0.77518 | 0.47825 | [plot](https://huggingface.co/deepghs/real_head_detection/blob/main/head_detect_v0_s_yv11/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_head_detection/blob/main/head_detect_v0_s_yv11/confusion_matrix_normalized.png) | `head` |
| head_detect_v0_n_yv11 | yolo | 6.44G | 2.59M | 0.74 | 0.14 | 0.87359 | 0.64011 | 0.73393 | 0.44118 | [plot](https://huggingface.co/deepghs/real_head_detection/blob/main/head_detect_v0_n_yv11/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_head_detection/blob/main/head_detect_v0_n_yv11/confusion_matrix_normalized.png) | `head` |
| head_detect_v0_l | yolo | 165G | 43.6M | 0.81 | 0.234 | 0.89921 | 0.74092 | 0.81715 | 0.51615 | [plot](https://huggingface.co/deepghs/real_head_detection/blob/main/head_detect_v0_l/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_head_detection/blob/main/head_detect_v0_l/confusion_matrix_normalized.png) | `head` |
| head_detect_v0_m | yolo | 79.1G | 25.9M | 0.8 | 0.228 | 0.90006 | 0.72646 | 0.80614 | 0.50586 | [plot](https://huggingface.co/deepghs/real_head_detection/blob/main/head_detect_v0_m/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_head_detection/blob/main/head_detect_v0_m/confusion_matrix_normalized.png) | `head` |
| head_detect_v0_s | yolo | 28.6G | 11.1M | 0.78 | 0.182 | 0.89224 | 0.69382 | 0.77804 | 0.48067 | [plot](https://huggingface.co/deepghs/real_head_detection/blob/main/head_detect_v0_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_head_detection/blob/main/head_detect_v0_s/confusion_matrix_normalized.png) | `head` |
| head_detect_v0_n | yolo | 8.19G | 3.01M | 0.74 | 0.172 | 0.8728 | 0.64823 | 0.73865 | 0.44501 | [plot](https://huggingface.co/deepghs/real_head_detection/blob/main/head_detect_v0_n/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_head_detection/blob/main/head_detect_v0_n/confusion_matrix_normalized.png) | `head` |

___

# [deepghs/real_face_detection](https://huggingface.co/deepghs/real_face_detection)
| Model | Type | FLOPS | Params | F1 Score | Threshold | precision(B) | recall(B) | mAP50(B) | mAP50-95(B) | F1 Plot | Confusion | Labels |
|:---------------------:|:------:|:-------:|:--------:|:----------:|:-----------:|:--------------:|:-----------:|:----------:|:-------------:|:-------------------------------------------------------------------------------------------------------:|:-------------------------------------------------------------------------------------------------------------------------------:|:--------:|
| face_detect_v0_s_yv12 | yolo | 21.5G | 9.25M | 0.74 | 0.272 | 0.86931 | 0.6404 | 0.73074 | 0.42652 | [plot](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_s_yv12/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_s_yv12/confusion_matrix_normalized.png) | `face` |
| face_detect_v0_n_yv12 | yolo | 6.48G | 2.57M | 0.7 | 0.258 | 0.85246 | 0.59089 | 0.6793 | 0.39182 | [plot](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_n_yv12/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_n_yv12/confusion_matrix_normalized.png) | `face` |
| face_detect_v0_l_yv11 | yolo | 87.3G | 25.3M | 0.77 | 0.291 | 0.88458 | 0.67474 | 0.76666 | 0.45722 | [plot](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_l_yv11/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_l_yv11/confusion_matrix_normalized.png) | `face` |
| face_detect_v0_m_yv11 | yolo | 68.2G | 20.1M | 0.76 | 0.262 | 0.87947 | 0.67315 | 0.76073 | 0.45288 | [plot](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_m_yv11/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_m_yv11/confusion_matrix_normalized.png) | `face` |
| face_detect_v0_s_yv11 | yolo | 21.5G | 9.43M | 0.73 | 0.271 | 0.87001 | 0.63572 | 0.72683 | 0.42706 | [plot](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_s_yv11/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_s_yv11/confusion_matrix_normalized.png) | `face` |
| face_detect_v0_n_yv11 | yolo | 6.44G | 2.59M | 0.7 | 0.263 | 0.86044 | 0.58577 | 0.67641 | 0.38975 | [plot](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_n_yv11/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_n_yv11/confusion_matrix_normalized.png) | `face` |
| face_detect_v0_l | yolo | 165G | 43.6M | 0.76 | 0.277 | 0.87894 | 0.67335 | 0.76313 | 0.4532 | [plot](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_l/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_l/confusion_matrix_normalized.png) | `face` |
| face_detect_v0_m | yolo | 79.1G | 25.9M | 0.75 | 0.277 | 0.87687 | 0.66265 | 0.75114 | 0.44262 | [plot](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_m/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_m/confusion_matrix_normalized.png) | `face` |
| face_detect_v0_s | yolo | 28.6G | 11.1M | 0.73 | 0.282 | 0.86932 | 0.63557 | 0.72494 | 0.42219 | [plot](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_s/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_s/confusion_matrix_normalized.png) | `face` |
| face_detect_v0_n | yolo | 8.19G | 3.01M | 0.7 | 0.257 | 0.85337 | 0.58877 | 0.67471 | 0.38692 | [plot](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_n/F1_curve.png) | [confusion](https://huggingface.co/deepghs/real_face_detection/blob/main/face_detect_v0_n/confusion_matrix_normalized.png) | `face` |

___

app.py
ADDED
@@ -0,0 +1,1396 @@
import io
import os
import gc
import re
import cv2
import time
import zipfile
import tempfile
import traceback
import numpy as np
import gradio as gr
import imgutils.detect.person as person_detector
import imgutils.detect.halfbody as halfbody_detector
import imgutils.detect.head as head_detector
import imgutils.detect.face as face_detector
import imgutils.metrics.ccip as ccip_analyzer
import imgutils.metrics.dbaesthetic as dbaesthetic_analyzer
import imgutils.metrics.lpips as lpips_module
from PIL import Image
from typing import List, Tuple, Dict, Any, Union, Optional, Iterator

# --- Constants for File Types ---
IMAGE_EXTENSIONS = ('.png', '.jpg', '.jpeg', '.webp', '.bmp', '.tiff', '.tif', '.gif')
VIDEO_EXTENSIONS = ('.mp4', '.avi', '.mov', '.mkv', '.flv', '.webm', '.mpeg', '.mpg')

# --- Helper Functions ---
def sanitize_filename(filename: str, max_len: int = 50) -> str:
    """Removes invalid characters and shortens a filename for safe use."""
    # Remove path components
    base_name = os.path.basename(filename)
    # Remove extension
    name_part, _ = os.path.splitext(base_name)
    # Replace spaces and problematic characters with underscores
    sanitized = re.sub(r'[\\/*?:"<>|\s]+', '_', name_part)
    # Remove leading/trailing underscores/periods
    sanitized = sanitized.strip('._')
    # Limit length (important for temp paths and OS limits)
    sanitized = sanitized[:max_len]
    # Ensure it's not empty after sanitization
    if not sanitized:
        return "file"
    return sanitized
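
# Illustration added for this write-up (not in the committed file): tracing the logic
# above, sanitize_filename("My Clip (final)?.mp4") drops the ".mp4" extension, replaces
# the spaces and the "?" with "_", strips the leftover trailing "_", and returns
# "My_Clip_(final)".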

def convert_to_pil(frame: np.ndarray) -> Image.Image:
    """Converts an OpenCV frame (BGR) to a PIL Image (RGB)."""
    # Add error handling for potentially empty frames
    if frame is None or frame.size == 0:
        raise ValueError("Cannot convert empty frame to PIL Image")
    try:
        return Image.fromarray(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB))
    except Exception as e:
        # Re-raise with more context if conversion fails
        raise RuntimeError(f"Failed to convert frame to PIL Image: {e}")

def image_to_bytes(img: Image.Image, format: str = 'PNG') -> bytes:
    """Converts a PIL Image to bytes."""
    if img is None:
        raise ValueError("Cannot convert None image to bytes")
    byte_arr = io.BytesIO()
    img.save(byte_arr, format=format)
    return byte_arr.getvalue()

def create_zip_file(image_data: Dict[str, bytes], output_path: str) -> None:
    """
    Creates a zip file containing the provided images directly at the output_path.

    Args:
        image_data: A dictionary where keys are filenames (including paths within zip)
                    and values are image bytes.
        output_path: The full path where the zip file should be created.
    """
    if not image_data:
        raise ValueError("No image data provided to create zip file.")
    if not output_path:
        raise ValueError("No output path provided for the zip file.")

    print(f"Creating zip file at: {output_path}")

    try:
        # Ensure parent directory exists (useful if output_path is nested)
        # Though NamedTemporaryFile usually handles this for its own path.
        parent_dir = os.path.dirname(output_path)
        if parent_dir:  # Check if there is a parent directory component
            os.makedirs(parent_dir, exist_ok=True)

        with zipfile.ZipFile(output_path, 'w', zipfile.ZIP_DEFLATED) as zipf:
            # Sort items for potentially better organization and predictability
            for filename, img_bytes in sorted(image_data.items()):
                zipf.writestr(filename, img_bytes)
        print(f"Successfully created zip file with {len(image_data)} items at {output_path}.")
        # No return value needed as we are writing to a path
    except Exception as e:
        print(f"Error creating zip file at {output_path}: {e}")
        # If zip creation fails, attempt to remove the partially created file
        if os.path.exists(output_path):
            try:
                os.remove(output_path)
                print(f"Removed partially created/failed zip file: {output_path}")
            except OSError as remove_err:
                print(f"Warning: Could not remove failed zip file {output_path}: {remove_err}")
        raise  # Re-raise the original exception

def generate_filename(
    base_name: str,  # Should be the core identifier, e.g., "frame_X_person_Y_scoreZ"
    aesthetic_label: Optional[str] = None,
    ccip_cluster_id_for_lpips_logic: Optional[int] = None,  # Original CCIP ID, used to decide if LPIPS is sub-cluster
    ccip_folder_naming_index: Optional[int] = None,  # The new 000, 001, ... index based on image count
    source_prefix_for_ccip_folder: Optional[str] = None,  # The source filename prefix for CCIP folder
    lpips_folder_naming_index: Optional[Union[int, str]] = None,  # New: Can be int (0,1,2...) or "noise"
    file_extension: str = '.png',
    # Suffix flags for this specific image:
    is_halfbody_primary_target_type: bool = False,  # If this image itself was a halfbody primary target
    is_derived_head_crop: bool = False,
    is_derived_face_crop: bool = False,
) -> str:
    """
    Generates the final filename, incorporating aesthetic label, cluster directory,
    and crop indicators. CCIP and LPIPS folder names are sorted by image count.
    """
    filename_stem = base_name

    # Add suffixes for derived crops.
    # For halfbody primary targets, the base_name should already contain "halfbody".
    # This flag is more for potentially adding a suffix if desired, but currently not used to add a suffix.
    # if is_halfbody_primary_target_type:
    #     filename_stem += "_halfbody"  # Potentially redundant if base_name good.

    if is_derived_head_crop:
        filename_stem += "_headCrop"
    if is_derived_face_crop:
        filename_stem += "_faceCrop"

    filename_with_extension = filename_stem + file_extension

    path_parts = []
    # New CCIP folder naming based on source prefix and sorted index
    if ccip_folder_naming_index is not None and source_prefix_for_ccip_folder is not None:
        path_parts.append(f"{source_prefix_for_ccip_folder}_ccip_{ccip_folder_naming_index:03d}")

    # LPIPS folder naming based on the new sorted index or "noise"
    if lpips_folder_naming_index is not None:
        lpips_folder_name_part_str: Optional[str] = None
        if isinstance(lpips_folder_naming_index, str) and lpips_folder_naming_index == "noise":
            lpips_folder_name_part_str = "noise"
        elif isinstance(lpips_folder_naming_index, int):
            lpips_folder_name_part_str = f"{lpips_folder_naming_index:03d}"

        if lpips_folder_name_part_str is not None:
            # Determine prefix based on whether the item was originally in a CCIP cluster
            if ccip_cluster_id_for_lpips_logic is not None:  # LPIPS is sub-cluster if item had an original CCIP ID
                lpips_folder_name_base = "lpips_sub_"
            else:  # No CCIP, LPIPS is primary
                lpips_folder_name_base = "lpips_"
            path_parts.append(f"{lpips_folder_name_base}{lpips_folder_name_part_str}")

    final_filename_part = filename_with_extension
    if aesthetic_label:
        final_filename_part = f"{aesthetic_label}_{filename_with_extension}"

    if path_parts:
        return f"{'/'.join(path_parts)}/{final_filename_part}"
    else:
        return final_filename_part
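
# Worked example (annotation added here, not present in the committed file): with
# base_name="frame_0001_person_0", aesthetic_label="best", ccip_folder_naming_index=2,
# source_prefix_for_ccip_folder="myvideo", lpips_folder_naming_index=0 and
# is_derived_head_crop=True, the function above returns
# "myvideo_ccip_002/lpips_000/best_frame_0001_person_0_headCrop.png"
# ("lpips_000" rather than "lpips_sub_000" because ccip_cluster_id_for_lpips_logic is None).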
164 |
+
|
165 |
+
# --- Core Processing Function for a single source (video or image sequence) ---
|
166 |
+
def _process_input_source_frames(
|
167 |
+
source_file_prefix: str, # Sanitized name for this source (e.g., "myvideo" or "ImageGroup123")
|
168 |
+
# Iterator yielding: (PIL.Image, frame_identifier (int, e.g. ms position or image index), current_item_index, total_items_for_desc)
|
169 |
+
# For videos, current_item_index is the 1-based raw frame number.
|
170 |
+
# For images, current_item_index is the 1-based image number in the sequence.
|
171 |
+
frames_provider: Iterator[Tuple[Image.Image, int, int, int]],
|
172 |
+
is_video_source: bool, # To adjust some logging/stats messages
|
173 |
+
# Person Detection
|
174 |
+
enable_person_detection: bool,
|
175 |
+
min_target_width_person_percentage: float,
|
176 |
+
person_model_name: str,
|
177 |
+
person_conf_threshold: float,
|
178 |
+
person_iou_threshold: float,
|
179 |
+
# Half-Body Detection
|
180 |
+
enable_halfbody_detection: bool,
|
181 |
+
enable_halfbody_cropping: bool,
|
182 |
+
min_target_width_halfbody_percentage: float,
|
183 |
+
halfbody_model_name: str,
|
184 |
+
halfbody_conf_threshold: float,
|
185 |
+
halfbody_iou_threshold: float,
|
186 |
+
# Head Detection
|
187 |
+
enable_head_detection: bool,
|
188 |
+
enable_head_cropping: bool,
|
189 |
+
min_crop_width_head_percentage: float,
|
190 |
+
enable_head_filtering: bool,
|
191 |
+
head_model_name: str,
|
192 |
+
head_conf_threshold: float,
|
193 |
+
head_iou_threshold: float,
|
194 |
+
# Face Detection
|
195 |
+
enable_face_detection: bool,
|
196 |
+
enable_face_cropping: bool,
|
197 |
+
min_crop_width_face_percentage: float,
|
198 |
+
enable_face_filtering: bool,
|
199 |
+
face_model_name: str,
|
200 |
+
face_conf_threshold: float,
|
201 |
+
face_iou_threshold: float,
|
202 |
+
# CCIP Classification
|
203 |
+
enable_ccip_classification: bool,
|
204 |
+
ccip_model_name: str,
|
205 |
+
ccip_threshold: float,
|
206 |
+
# LPIPS Clustering
|
207 |
+
enable_lpips_clustering: bool,
|
208 |
+
lpips_threshold: float,
|
209 |
+
# Aesthetic Analysis
|
210 |
+
enable_aesthetic_analysis: bool,
|
211 |
+
aesthetic_model_name: str,
|
212 |
+
# Gradio Progress (specific to this source's processing)
|
213 |
+
progress_updater # Function: (progress_value: float, desc: str) -> None
|
214 |
+
) -> Tuple[Optional[str], str]:
|
215 |
+
"""
|
216 |
+
Processes frames from a given source (video or image sequence) according to the specified parameters.
|
217 |
+
Order: Person => Half-Body (alternative) => Face Detection => Head Detection => CCIP => Aesthetic, then LPIPS clustering and zipping over all kept images.
|
218 |
+
|
219 |
+
Returns:
|
220 |
+
A tuple containing:
|
221 |
+
- Path to the output zip file (or None if error).
|
222 |
+
- Status message string.
|
223 |
+
"""
|
224 |
+
# This list will hold data for images that pass all filters, BEFORE LPIPS and final zipping
|
225 |
+
images_pending_final_processing: List[Dict[str, Any]] = []
|
226 |
+
|
227 |
+
# CCIP specific data
|
228 |
+
ccip_clusters_info: List[Tuple[int, np.ndarray]] = []
|
229 |
+
next_ccip_cluster_id = 0
|
230 |
+
|
231 |
+
# Stats
|
232 |
+
processed_items_count = 0
|
233 |
+
total_persons_detected_raw, total_halfbodies_detected_raw = 0, 0
|
234 |
+
person_targets_processed_count, halfbody_targets_processed_count, fullframe_targets_processed_count = 0, 0, 0
|
235 |
+
total_faces_detected_on_targets, total_heads_detected_on_targets = 0, 0
|
236 |
+
|
237 |
+
# These count items added to images_pending_final_processing
|
238 |
+
main_targets_pending_count, face_crops_pending_count, head_crops_pending_count = 0, 0, 0
|
239 |
+
items_filtered_by_face_count, items_filtered_by_head_count = 0, 0
|
240 |
+
ccip_applied_count, aesthetic_applied_count = 0, 0
|
241 |
+
# LPIPS stats
|
242 |
+
lpips_images_subject_to_clustering, total_lpips_clusters_created, total_lpips_noise_samples = 0, 0, 0
|
243 |
+
|
244 |
+
gc_interval = 100 # items from provider
|
245 |
+
start_time = time.time()
|
246 |
+
|
247 |
+
# Progress update for initializing this specific video
|
248 |
+
progress_updater(0, desc=f"Initializing {source_file_prefix}...")
|
249 |
+
output_zip_path_temp = None
|
250 |
+
output_zip_path_final = None
|
251 |
+
|
252 |
+
try:
|
253 |
+
# --- Main Loop for processing items from the frames_provider ---
|
254 |
+
for pil_image_full_frame, frame_specific_index, current_item_index, total_items_for_desc in frames_provider:
|
255 |
+
progress_value_for_updater = (current_item_index) / total_items_for_desc if total_items_for_desc > 0 else 1.0
|
256 |
+
|
257 |
+
|
258 |
+
# The description string should reflect what current_item_index means
|
259 |
+
item_description = ""
|
260 |
+
if is_video_source:
|
261 |
+
# For video, total_items_for_desc is the total raw frame count.
|
262 |
+
# current_item_index is the raw frame index of the *sampled* frame.
|
263 |
+
# We also need a counter for *sampled* frames for a "processed X of Y (sampled)" message.
|
264 |
+
# processed_items_count counts sampled frames.
|
265 |
+
item_description = f"frame {current_item_index}/{total_items_for_desc} (sampled frame #{processed_items_count + 1})"
|
266 |
+
|
267 |
+
else: # For images
|
268 |
+
item_description = f"image {current_item_index}/{total_items_for_desc}"
|
269 |
+
|
270 |
+
progress_updater(
|
271 |
+
min(progress_value_for_updater, 1.0), # Cap progress at 1.0
|
272 |
+
desc=f"Processing {item_description} for {source_file_prefix}"
|
273 |
+
)
|
274 |
+
# processed_items_count still counts how many items are yielded by the provider
|
275 |
+
# (i.e., how many sampled frames for video, or how many images for image sequence)
|
276 |
+
processed_items_count += 1
|
277 |
+
|
278 |
+
try:
|
279 |
+
full_frame_width = pil_image_full_frame.width # Store for percentage calculations
|
280 |
+
print(f"--- Processing item ID {frame_specific_index} (Width: {full_frame_width}px) for {source_file_prefix} ---")
|
281 |
+
|
282 |
+
# List to hold PIL images that are the primary subjects for this frame
|
283 |
+
# Each element: {'pil': Image, 'base_name': str, 'source_type': 'person'/'halfbody'/'fullframe'}
|
284 |
+
primary_targets_for_frame: List[Dict[str, Any]] = []
|
285 |
+
processed_primary_source_this_frame = False # Flag if Person or HalfBody yielded targets
|
286 |
+
|
287 |
+
# --- 1. Person Detection ---
|
288 |
+
if enable_person_detection and full_frame_width > 0:
|
289 |
+
print(" Attempting Person Detection...")
|
290 |
+
min_person_target_px_width = full_frame_width * min_target_width_person_percentage
|
291 |
+
person_detections = person_detector.detect_person(
|
292 |
+
pil_image_full_frame, model_name=person_model_name,
|
293 |
+
conf_threshold=person_conf_threshold, iou_threshold=person_iou_threshold
|
294 |
+
)
|
295 |
+
total_persons_detected_raw += len(person_detections)
|
296 |
+
if person_detections:
|
297 |
+
print(f" Detected {len(person_detections)} raw persons.")
|
298 |
+
valid_person_targets = 0
|
299 |
+
for i, (bbox, _, score) in enumerate(person_detections):
|
300 |
+
# Check width before full crop for minor optimization
|
301 |
+
detected_person_width = bbox[2] - bbox[0]
|
302 |
+
if detected_person_width >= min_person_target_px_width:
|
303 |
+
primary_targets_for_frame.append({
|
304 |
+
'pil': pil_image_full_frame.crop(bbox),
|
305 |
+
'base_name': f"{source_file_prefix}_item_{frame_specific_index}_person_{i}_score{int(score*100)}",
|
306 |
+
'source_type': 'person'})
|
307 |
+
person_targets_processed_count +=1
|
308 |
+
valid_person_targets +=1
|
309 |
+
else:
|
310 |
+
print(f" Person {i} width {detected_person_width}px < min {min_person_target_px_width:.0f}px. Skipping.")
|
311 |
+
if valid_person_targets > 0:
|
312 |
+
processed_primary_source_this_frame = True
|
313 |
+
print(f" Added {valid_person_targets} persons as primary targets.")
|
314 |
+
|
315 |
+
# --- 2. Half-Body Detection (if Person not processed and HBD enabled) ---
|
316 |
+
if not processed_primary_source_this_frame and enable_halfbody_detection and full_frame_width > 0:
|
317 |
+
print(" Attempting Half-Body Detection (on full item)...")
|
318 |
+
min_halfbody_target_px_width = full_frame_width * min_target_width_halfbody_percentage
|
319 |
+
halfbody_detections = halfbody_detector.detect_halfbody(
|
320 |
+
pil_image_full_frame, model_name=halfbody_model_name,
|
321 |
+
conf_threshold=halfbody_conf_threshold, iou_threshold=halfbody_iou_threshold
|
322 |
+
)
|
323 |
+
total_halfbodies_detected_raw += len(halfbody_detections)
|
324 |
+
if halfbody_detections:
|
325 |
+
print(f" Detected {len(halfbody_detections)} raw half-bodies.")
|
326 |
+
valid_halfbody_targets = 0
|
327 |
+
for i, (bbox, _, score) in enumerate(halfbody_detections):
|
328 |
+
detected_hb_width = bbox[2] - bbox[0]
|
329 |
+
# Cropping must be enabled and width must be sufficient for it to be a target
|
330 |
+
if enable_halfbody_cropping and detected_hb_width >= min_halfbody_target_px_width:
|
331 |
+
primary_targets_for_frame.append({
|
332 |
+
'pil': pil_image_full_frame.crop(bbox),
|
333 |
+
'base_name': f"{source_file_prefix}_item_{frame_specific_index}_halfbody_{i}_score{int(score*100)}",
|
334 |
+
'source_type': 'halfbody'})
|
335 |
+
halfbody_targets_processed_count +=1
|
336 |
+
valid_halfbody_targets +=1
|
337 |
+
elif enable_halfbody_cropping:
|
338 |
+
print(f" Half-body {i} width {detected_hb_width}px < min {min_halfbody_target_px_width:.0f}px. Skipping.")
|
339 |
+
if valid_halfbody_targets > 0:
|
340 |
+
processed_primary_source_this_frame = True
|
341 |
+
print(f" Added {valid_halfbody_targets} half-bodies as primary targets.")
|
342 |
+
|
343 |
+
# --- 3. Full Frame/Image (fallback) ---
|
344 |
+
if not processed_primary_source_this_frame:
|
345 |
+
print(" Processing Full Item as primary target.")
|
346 |
+
primary_targets_for_frame.append({
|
347 |
+
'pil': pil_image_full_frame.copy(),
|
348 |
+
'base_name': f"{source_file_prefix}_item_{frame_specific_index}_full",
|
349 |
+
'source_type': 'fullframe'})
|
350 |
+
fullframe_targets_processed_count += 1
|
351 |
+
|
352 |
+
# --- Process each identified primary_target_for_frame ---
|
353 |
+
for target_data in primary_targets_for_frame:
|
354 |
+
current_pil: Image.Image = target_data['pil']
|
355 |
+
current_base_name: str = target_data['base_name'] # Base name for this main target
|
356 |
+
current_source_type: str = target_data['source_type']
|
357 |
+
current_pil_width = current_pil.width # For sub-crop percentage calculations
|
358 |
+
print(f" Processing target: {current_base_name} (type: {current_source_type}, width: {current_pil_width}px)")
|
359 |
+
|
360 |
+
# Store PILs of successful crops from current_pil for this target
|
361 |
+
keep_this_target = True
|
362 |
+
item_area = current_pil_width * current_pil.height
|
363 |
+
potential_face_crops_pil: List[Image.Image] = []
|
364 |
+
potential_head_crops_pil: List[Image.Image] = []
|
365 |
+
|
366 |
+
# --- A. Face Detection ---
|
367 |
+
if keep_this_target and enable_face_detection and current_pil_width > 0:
|
368 |
+
print(f" Detecting faces in {current_base_name}...")
|
369 |
+
min_face_crop_px_width = current_pil_width * min_crop_width_face_percentage
|
370 |
+
face_detections = face_detector.detect_faces(
|
371 |
+
current_pil, model_name=face_model_name,
|
372 |
+
conf_threshold=face_conf_threshold, iou_threshold=face_iou_threshold
|
373 |
+
)
|
374 |
+
total_faces_detected_on_targets += len(face_detections)
|
375 |
+
if not face_detections and enable_face_filtering:
|
376 |
+
keep_this_target = False
|
377 |
+
items_filtered_by_face_count += 1
|
378 |
+
print(f" FILTERING TARGET {current_base_name} (no face).")
|
379 |
+
elif face_detections and enable_face_cropping:
|
380 |
+
for f_idx, (f_bbox, _, _) in enumerate(face_detections):
|
381 |
+
if (f_bbox[2]-f_bbox[0]) >= min_face_crop_px_width:
|
382 |
+
potential_face_crops_pil.append(current_pil.crop(f_bbox))
|
383 |
+
else:
|
384 |
+
print(f" Face {f_idx} too small. Skipping crop.")
|
385 |
+
|
386 |
+
# --- B. Head Detection ---
|
387 |
+
if keep_this_target and enable_head_detection and current_pil_width > 0:
|
388 |
+
print(f" Detecting heads in {current_base_name}...")
|
389 |
+
min_head_crop_px_width = current_pil_width * min_crop_width_head_percentage
|
390 |
+
head_detections = head_detector.detect_heads(
|
391 |
+
current_pil, model_name=head_model_name,
|
392 |
+
conf_threshold=head_conf_threshold, iou_threshold=head_iou_threshold
|
393 |
+
)
|
394 |
+
total_heads_detected_on_targets += len(head_detections)
|
395 |
+
if not head_detections and enable_head_filtering:
|
396 |
+
keep_this_target = False
|
397 |
+
items_filtered_by_head_count += 1
|
398 |
+
print(f" FILTERING TARGET {current_base_name} (no head).")
|
399 |
+
potential_face_crops_pil.clear() # Clear faces if head filter removed target
|
400 |
+
elif head_detections and enable_head_cropping:
|
401 |
+
for h_idx, (h_bbox, _, _) in enumerate(head_detections):
|
402 |
+
h_w = h_bbox[2]-h_bbox[0] # h_h = h_bbox[3]-h_bbox[1]
|
403 |
+
if h_w >= min_head_crop_px_width and item_area > 0:
|
404 |
+
potential_head_crops_pil.append(current_pil.crop(h_bbox))
|
405 |
+
else:
|
406 |
+
print(f" Head {h_idx} too small or too large relative to parent. Skipping crop.")
|
407 |
+
|
408 |
+
# --- If target is filtered, clean up and skip to next target ---
|
409 |
+
if not keep_this_target:
|
410 |
+
print(f" Target {current_base_name} was filtered by face/head presence rules. Discarding it and its potential crops.")
|
411 |
+
if current_pil is not None:
|
412 |
+
del current_pil
|
413 |
+
potential_face_crops_pil.clear()
|
414 |
+
potential_head_crops_pil.clear()
|
415 |
+
continue # To the next primary_target_for_frame
|
416 |
+
|
417 |
+
# --- C. CCIP Classification (on current_pil, if it's kept) ---
|
418 |
+
assigned_ccip_id = None # This is the original CCIP ID
|
419 |
+
if enable_ccip_classification:
|
420 |
+
print(f" Classifying {current_base_name} with CCIP...")
|
421 |
+
try:
|
422 |
+
feature = ccip_analyzer.ccip_extract_feature(current_pil, model=ccip_model_name)
|
423 |
+
best_match_cid = None
|
424 |
+
min_diff = float('inf')
|
425 |
+
# Find the best potential match among existing clusters
|
426 |
+
if ccip_clusters_info: # Only loop if there are clusters to compare against
|
427 |
+
for cid, rep_f in ccip_clusters_info:
|
428 |
+
diff = ccip_analyzer.ccip_difference(feature, rep_f, model=ccip_model_name)
|
429 |
+
if diff < min_diff:
|
430 |
+
min_diff = diff
|
431 |
+
best_match_cid = cid
|
432 |
+
|
433 |
+
# Decide whether to use the best match or create a new cluster
|
434 |
+
if best_match_cid is not None and min_diff < ccip_threshold:
|
435 |
+
assigned_ccip_id = best_match_cid
|
436 |
+
print(f" -> Matched Cluster {assigned_ccip_id} (Diff: {min_diff:.6f} <= Threshold {ccip_threshold:.3f})")
|
437 |
+
else:
|
438 |
+
# No suitable match found (either no clusters existed, or the best match's diff was not below the threshold)
|
439 |
+
# Create a new cluster
|
440 |
+
assigned_ccip_id = next_ccip_cluster_id
|
441 |
+
ccip_clusters_info.append((assigned_ccip_id, feature))
|
442 |
+
if len(ccip_clusters_info) == 1:  # the cluster just appended is the only one
|
443 |
+
print(f" -> New Cluster {assigned_ccip_id} (First item or no prior suitable clusters)")
|
444 |
+
else:
|
445 |
+
# Log that a new cluster is formed because the minimum difference was not below the threshold
|
446 |
+
print(f" -> New Cluster {assigned_ccip_id} (Min diff to others: {min_diff:.6f} > Threshold {ccip_threshold:.3f})")
|
447 |
+
next_ccip_cluster_id += 1
|
448 |
+
print(f" CCIP: Target {current_base_name} -> Original Cluster ID {assigned_ccip_id}")
|
449 |
+
del feature
|
450 |
+
ccip_applied_count += 1
|
451 |
+
except Exception as e_ccip:
|
452 |
+
print(f" Error CCIP: {e_ccip}")
|
453 |
+
|
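# Worked example of the greedy assignment above (hypothetical numbers): with
# ccip_threshold = 0.20 and existing representatives differing from the new feature by
# {cluster 0: 0.31, cluster 1: 0.17}, the minimum 0.17 is below the threshold, so the
# target joins cluster 1; had the closest difference been 0.25, a brand-new cluster
# would be created with this feature as its representative.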
454 |
+
# --- D. Aesthetic Analysis (on current_pil, if it's kept) ---
|
455 |
+
item_aesthetic_label = None
|
456 |
+
if enable_aesthetic_analysis:
|
457 |
+
print(f" Analyzing {current_base_name} for aesthetics...")
|
458 |
+
try:
|
459 |
+
res = dbaesthetic_analyzer.anime_dbaesthetic(current_pil, model_name=aesthetic_model_name)
|
460 |
+
if isinstance(res, tuple) and len(res) >= 1:
|
461 |
+
item_aesthetic_label = res[0]
|
462 |
+
print(f" Aesthetic: Target {current_base_name} -> {item_aesthetic_label}")
|
463 |
+
aesthetic_applied_count += 1
|
464 |
+
except Exception as e_aes:
|
465 |
+
print(f" Error Aesthetic: {e_aes}")
|
466 |
+
|
467 |
+
add_current_pil_to_pending_list = True
|
468 |
+
if current_source_type == 'fullframe':
|
469 |
+
can_skip_fullframe_target = False
|
470 |
+
if enable_face_detection or enable_head_detection:
|
471 |
+
found_valid_sub_crop_from_enabled_detector = False
|
472 |
+
if enable_face_detection and len(potential_face_crops_pil) > 0:
|
473 |
+
found_valid_sub_crop_from_enabled_detector = True
|
474 |
+
|
475 |
+
if not found_valid_sub_crop_from_enabled_detector and \
|
476 |
+
enable_head_detection and len(potential_head_crops_pil) > 0:
|
477 |
+
found_valid_sub_crop_from_enabled_detector = True
|
478 |
+
|
479 |
+
if not found_valid_sub_crop_from_enabled_detector: # No valid crops from any enabled sub-detector
|
480 |
+
can_skip_fullframe_target = True # All enabled sub-detectors failed
|
481 |
+
|
482 |
+
if can_skip_fullframe_target:
|
483 |
+
add_current_pil_to_pending_list = False
|
484 |
+
print(f" Skipping save of fullframe target '{current_base_name}' because all enabled sub-detectors (Face/Head) yielded no valid-width crops.")
|
485 |
+
|
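# Illustrative case for the rule above: if only face detection is enabled and it yields
# no crop of sufficient width, a 'fullframe' target is dropped entirely, whereas a
# 'person' or 'halfbody' target in the same situation is still saved.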
486 |
+
if add_current_pil_to_pending_list:
|
487 |
+
# --- E. Save current_pil (if it passed all filters) ---
|
488 |
+
# Add main target to pending list
|
489 |
+
images_pending_final_processing.append({
|
490 |
+
'pil_image': current_pil.copy(), 'base_name_for_filename': current_base_name,
|
491 |
+
'ccip_cluster_id': assigned_ccip_id, 'aesthetic_label': item_aesthetic_label,
|
492 |
+
'is_halfbody_primary_target_type': (current_source_type == 'halfbody'),
|
493 |
+
'is_derived_head_crop': False, 'is_derived_face_crop': False,
|
494 |
+
'lpips_cluster_id': None, # Will be filled by LPIPS clustering
|
495 |
+
'lpips_folder_naming_index': None # Will be filled by LPIPS renaming
|
496 |
+
})
|
497 |
+
main_targets_pending_count +=1
|
498 |
+
|
499 |
+
# --- F. Save Face Crops (derived from current_pil) ---
|
500 |
+
for i, fc_pil in enumerate(potential_face_crops_pil):
|
501 |
+
images_pending_final_processing.append({
|
502 |
+
'pil_image': fc_pil, 'base_name_for_filename': f"{current_base_name}_face{i}",
|
503 |
+
'ccip_cluster_id': assigned_ccip_id, 'aesthetic_label': item_aesthetic_label,
|
504 |
+
'is_halfbody_primary_target_type': False,
|
505 |
+
'is_derived_head_crop': False, 'is_derived_face_crop': True,
|
506 |
+
'lpips_cluster_id': None,
|
507 |
+
'lpips_folder_naming_index': None
|
508 |
+
})
|
509 |
+
face_crops_pending_count+=1
|
510 |
+
potential_face_crops_pil.clear()
|
511 |
+
|
512 |
+
# --- G. Save Head Crops (derived from current_pil) ---
|
513 |
+
for i, hc_pil in enumerate(potential_head_crops_pil):
|
514 |
+
images_pending_final_processing.append({
|
515 |
+
'pil_image': hc_pil, 'base_name_for_filename': f"{current_base_name}_head{i}",
|
516 |
+
'ccip_cluster_id': assigned_ccip_id, 'aesthetic_label': item_aesthetic_label,
|
517 |
+
'is_halfbody_primary_target_type': False,
|
518 |
+
'is_derived_head_crop': True, 'is_derived_face_crop': False,
|
519 |
+
'lpips_cluster_id': None,
|
520 |
+
'lpips_folder_naming_index': None
|
521 |
+
})
|
522 |
+
head_crops_pending_count+=1
|
523 |
+
potential_head_crops_pil.clear()
|
524 |
+
|
525 |
+
if current_pil is not None: # Ensure current_pil exists before attempting to delete
|
526 |
+
del current_pil # Clean up the PIL for this target_data
|
527 |
+
|
528 |
+
primary_targets_for_frame.clear()
|
529 |
+
except Exception as item_proc_err:
|
530 |
+
print(f"!! Major Error processing item ID {frame_specific_index} for {source_file_prefix}: {item_proc_err}")
|
531 |
+
traceback.print_exc()
|
532 |
+
# Cleanup local vars for this item if error
|
533 |
+
if 'primary_targets_for_frame' in locals():
|
534 |
+
primary_targets_for_frame.clear()
|
535 |
+
# Also ensure current_pil from inner loop is cleaned up if error happened mid-loop
|
536 |
+
if 'current_pil' in locals() and current_pil is not None:
|
537 |
+
del current_pil
|
538 |
+
|
539 |
+
if processed_items_count % gc_interval == 0:
|
540 |
+
gc.collect()
|
541 |
+
print(f" [GC triggered at {processed_items_count} items for {source_file_prefix}]")
|
542 |
+
# --- End of Main Item Processing Loop ---
|
543 |
+
|
544 |
+
print(f"\nRunning final GC before LPIPS/Zipping for {source_file_prefix}...")
|
545 |
+
gc.collect()
|
546 |
+
|
547 |
+
if not images_pending_final_processing:
|
548 |
+
status_message = f"Processing for {source_file_prefix} finished, but no images were generated or passed filters for LPIPS/Zipping."
|
549 |
+
print(status_message)
|
550 |
+
return None, status_message
|
551 |
+
|
552 |
+
# --- LPIPS Clustering Stage ---
|
553 |
+
print(f"\n--- LPIPS Clustering Stage for {source_file_prefix} (Images pending: {len(images_pending_final_processing)}) ---")
|
554 |
+
if enable_lpips_clustering:
|
555 |
+
print(f" LPIPS Clustering enabled with threshold: {lpips_threshold}")
|
556 |
+
lpips_images_subject_to_clustering = len(images_pending_final_processing)
|
557 |
+
|
558 |
+
if enable_ccip_classification and next_ccip_cluster_id > 0: # CCIP was used
|
559 |
+
print(" LPIPS clustering within CCIP clusters.")
|
560 |
+
images_by_ccip: Dict[Optional[int], List[int]] = {} # ccip_id -> list of original indices
|
561 |
+
for i, item_data in enumerate(images_pending_final_processing):
|
562 |
+
ccip_id = item_data['ccip_cluster_id'] # Original CCIP ID
|
563 |
+
if ccip_id not in images_by_ccip:
|
564 |
+
images_by_ccip[ccip_id] = []
|
565 |
+
images_by_ccip[ccip_id].append(i)
|
566 |
+
|
567 |
+
for ccip_id, indices_in_ccip_cluster in images_by_ccip.items():
|
568 |
+
pils_for_lpips_sub_cluster = [images_pending_final_processing[idx]['pil_image'] for idx in indices_in_ccip_cluster]
|
569 |
+
if len(pils_for_lpips_sub_cluster) > 1:
|
570 |
+
print(f" Clustering {len(pils_for_lpips_sub_cluster)} images in CCIP cluster {ccip_id}...")
|
571 |
+
try:
|
572 |
+
lpips_sub_ids = lpips_module.lpips_clustering(pils_for_lpips_sub_cluster, threshold=lpips_threshold)
|
573 |
+
for i_sub, lpips_id in enumerate(lpips_sub_ids):
|
574 |
+
original_idx = indices_in_ccip_cluster[i_sub]
|
575 |
+
images_pending_final_processing[original_idx]['lpips_cluster_id'] = lpips_id
|
576 |
+
except Exception as e_lpips_sub:
|
577 |
+
print(f" Error LPIPS sub-cluster CCIP {ccip_id}: {e_lpips_sub}")
|
578 |
+
elif len(pils_for_lpips_sub_cluster) == 1:
|
579 |
+
images_pending_final_processing[indices_in_ccip_cluster[0]]['lpips_cluster_id'] = 0 # type: ignore
|
580 |
+
del images_by_ccip
|
581 |
+
if 'pils_for_lpips_sub_cluster' in locals():
|
582 |
+
del pils_for_lpips_sub_cluster # Ensure cleanup
|
583 |
+
else: # LPIPS on all images globally
|
584 |
+
print(" LPIPS clustering on all collected images.")
|
585 |
+
all_pils_for_global_lpips = [item['pil_image'] for item in images_pending_final_processing]
|
586 |
+
if len(all_pils_for_global_lpips) > 1:
|
587 |
+
try:
|
588 |
+
lpips_global_ids = lpips_module.lpips_clustering(all_pils_for_global_lpips, threshold=lpips_threshold)
|
589 |
+
for i, lpips_id in enumerate(lpips_global_ids):
|
590 |
+
images_pending_final_processing[i]['lpips_cluster_id'] = lpips_id
|
591 |
+
except Exception as e_lpips_global:
|
592 |
+
print(f" Error LPIPS global: {e_lpips_global}")
|
593 |
+
elif len(all_pils_for_global_lpips) == 1:
|
594 |
+
images_pending_final_processing[0]['lpips_cluster_id'] = 0 # type: ignore
|
595 |
+
del all_pils_for_global_lpips
|
596 |
+
|
597 |
+
# Calculate LPIPS stats
|
598 |
+
all_final_lpips_ids = [item.get('lpips_cluster_id') for item in images_pending_final_processing if item.get('lpips_cluster_id') is not None]
|
599 |
+
if all_final_lpips_ids:
|
600 |
+
unique_lpips_clusters = set(filter(lambda x: x != -1, all_final_lpips_ids))
|
601 |
+
total_lpips_clusters_created = len(unique_lpips_clusters)
|
602 |
+
total_lpips_noise_samples = sum(1 for x in all_final_lpips_ids if x == -1)
|
603 |
+
else:
|
604 |
+
print(" LPIPS Clustering disabled.")
|
605 |
+
|
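# Example of the label convention handled above (hypothetical output): lpips_clustering
# returning [0, 0, -1, 1] for four images means two clusters (0 and 1) plus one noise
# sample (-1), so the stats below would report 2 clusters and 1 noise image.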
606 |
+
# --- CCIP Folder Renaming Logic ---
|
607 |
+
original_ccip_id_to_new_naming_index: Dict[int, int] = {}
|
608 |
+
if enable_ccip_classification:
|
609 |
+
print(f" Preparing CCIP folder renaming for {source_file_prefix}...")
|
610 |
+
ccip_image_counts: Dict[int, int] = {} # original_ccip_id -> count of images in it
|
611 |
+
for item_data_for_count in images_pending_final_processing:
|
612 |
+
original_ccip_id_val = item_data_for_count.get('ccip_cluster_id')
|
613 |
+
if original_ccip_id_val is not None:
|
614 |
+
ccip_image_counts[original_ccip_id_val] = ccip_image_counts.get(original_ccip_id_val, 0) + 1
|
615 |
+
|
616 |
+
if ccip_image_counts:
|
617 |
+
# Sort original ccip_ids by their counts in descending order
|
618 |
+
sorted_ccip_groups_by_count: List[Tuple[int, int]] = sorted(
|
619 |
+
ccip_image_counts.items(),
|
620 |
+
key=lambda item: item[1], # Sort by count
|
621 |
+
reverse=True
|
622 |
+
)
|
623 |
+
for new_idx, (original_id, count) in enumerate(sorted_ccip_groups_by_count):
|
624 |
+
original_ccip_id_to_new_naming_index[original_id] = new_idx
|
625 |
+
print(f" CCIP Remap for {source_file_prefix}: Original ID {original_id} (count: {count}) -> New Naming Index {new_idx:03d}")
|
626 |
+
else:
|
627 |
+
print(f" No CCIP-assigned images found for {source_file_prefix} to perform renaming.")
|
628 |
+
|
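# Worked example of the count-based renaming above (hypothetical counts): if original
# CCIP IDs 0, 1 and 2 hold 5, 12 and 3 images, sorting by count maps 1 -> 000, 0 -> 001
# and 2 -> 002, so the most populous cluster becomes "<source_prefix>_ccip_000". The
# LPIPS renaming below applies the same count-based scheme within each group, sending
# noise samples (-1) to a "noise" folder.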
629 |
+
# --- LPIPS Folder Renaming Logic ---
|
630 |
+
if enable_lpips_clustering:
|
631 |
+
print(f" Preparing LPIPS folder renaming for {source_file_prefix}...")
|
632 |
+
# Initialize/Reset lpips_folder_naming_index for all items
|
633 |
+
for item_data in images_pending_final_processing:
|
634 |
+
item_data['lpips_folder_naming_index'] = None
|
635 |
+
|
636 |
+
if enable_ccip_classification and next_ccip_cluster_id > 0: # LPIPS within CCIP
|
637 |
+
print(f" LPIPS renaming within CCIP clusters for {source_file_prefix}.")
|
638 |
+
items_grouped_by_original_ccip: Dict[Optional[int], List[Dict[str, Any]]] = {}
|
639 |
+
for item_data in images_pending_final_processing:
|
640 |
+
original_ccip_id = item_data.get('ccip_cluster_id')
|
641 |
+
if original_ccip_id not in items_grouped_by_original_ccip: items_grouped_by_original_ccip[original_ccip_id] = []
|
642 |
+
items_grouped_by_original_ccip[original_ccip_id].append(item_data)
|
643 |
+
|
644 |
+
for original_ccip_id, items_in_ccip in items_grouped_by_original_ccip.items():
|
645 |
+
lpips_counts_in_ccip: Dict[int, int] = {} # original_lpips_id (non-noise) -> count
|
646 |
+
for item_data in items_in_ccip:
|
647 |
+
lpips_id = item_data.get('lpips_cluster_id')
|
648 |
+
if lpips_id is not None and lpips_id != -1:
|
649 |
+
lpips_counts_in_ccip[lpips_id] = lpips_counts_in_ccip.get(lpips_id, 0) + 1
|
650 |
+
|
651 |
+
lpips_id_to_naming_in_ccip: Dict[int, Union[int, str]] = {}
|
652 |
+
if lpips_counts_in_ccip:
|
653 |
+
sorted_lpips = sorted(lpips_counts_in_ccip.items(), key=lambda x: x[1], reverse=True)
|
654 |
+
for new_idx, (lpips_id, count) in enumerate(sorted_lpips):
|
655 |
+
lpips_id_to_naming_in_ccip[lpips_id] = new_idx
|
656 |
+
ccip_disp = f"OrigCCIP-{original_ccip_id}" if original_ccip_id is not None else "NoCCIP"
|
657 |
+
print(f" LPIPS Remap in {ccip_disp}: OrigLPIPS ID {lpips_id} (count: {count}) -> New Naming Index {new_idx:03d}")
|
658 |
+
|
659 |
+
for item_data in items_in_ccip:
|
660 |
+
lpips_id = item_data.get('lpips_cluster_id')
|
661 |
+
if lpips_id is not None:
|
662 |
+
if lpips_id == -1: item_data['lpips_folder_naming_index'] = "noise"
|
663 |
+
elif lpips_id in lpips_id_to_naming_in_ccip:
|
664 |
+
item_data['lpips_folder_naming_index'] = lpips_id_to_naming_in_ccip[lpips_id]
|
665 |
+
del items_grouped_by_original_ccip
|
666 |
+
else: # Global LPIPS
|
667 |
+
print(f" Global LPIPS renaming for {source_file_prefix}.")
|
668 |
+
global_lpips_counts: Dict[int, int] = {}
|
669 |
+
for item_data in images_pending_final_processing:
|
670 |
+
lpips_id = item_data.get('lpips_cluster_id')
|
671 |
+
if lpips_id is not None and lpips_id != -1:
|
672 |
+
global_lpips_counts[lpips_id] = global_lpips_counts.get(lpips_id, 0) + 1
|
673 |
+
|
674 |
+
global_lpips_id_to_naming: Dict[int, Union[int, str]] = {}
|
675 |
+
if global_lpips_counts:
|
676 |
+
sorted_global_lpips = sorted(global_lpips_counts.items(), key=lambda x: x[1], reverse=True)
|
677 |
+
for new_idx, (lpips_id, count) in enumerate(sorted_global_lpips):
|
678 |
+
global_lpips_id_to_naming[lpips_id] = new_idx
|
679 |
+
print(f" Global LPIPS Remap: OrigLPIPS ID {lpips_id} (count: {count}) -> New Naming Index {new_idx:03d}")
|
680 |
+
|
681 |
+
for item_data in images_pending_final_processing:
|
682 |
+
lpips_id = item_data.get('lpips_cluster_id')
|
683 |
+
if lpips_id is not None:
|
684 |
+
if lpips_id == -1: item_data['lpips_folder_naming_index'] = "noise"
|
685 |
+
elif lpips_id in global_lpips_id_to_naming:
|
686 |
+
item_data['lpips_folder_naming_index'] = global_lpips_id_to_naming[lpips_id]
|
687 |
+
gc.collect()
|
688 |
+
|
689 |
+
# --- Final Zipping Stage ---
|
690 |
+
images_to_zip: Dict[str, bytes] = {}
|
691 |
+
print(f"\n--- Final Zipping Stage for {source_file_prefix} ({len(images_pending_final_processing)} items) ---")
|
692 |
+
for item_data in images_pending_final_processing:
|
693 |
+
original_ccip_id_for_item = item_data.get('ccip_cluster_id')
|
694 |
+
current_ccip_naming_idx_for_folder: Optional[int] = None
|
695 |
+
|
696 |
+
if enable_ccip_classification and original_ccip_id_for_item is not None and \
|
697 |
+
original_ccip_id_for_item in original_ccip_id_to_new_naming_index:
|
698 |
+
current_ccip_naming_idx_for_folder = original_ccip_id_to_new_naming_index[original_ccip_id_for_item]
|
699 |
+
|
700 |
+
current_lpips_naming_idx_for_folder = item_data.get('lpips_folder_naming_index')
|
701 |
+
|
702 |
+
final_filename = generate_filename(
|
703 |
+
base_name=item_data['base_name_for_filename'],
|
704 |
+
aesthetic_label=item_data.get('aesthetic_label'),
|
705 |
+
ccip_cluster_id_for_lpips_logic=original_ccip_id_for_item,
|
706 |
+
ccip_folder_naming_index=current_ccip_naming_idx_for_folder,
|
707 |
+
source_prefix_for_ccip_folder=source_file_prefix if current_ccip_naming_idx_for_folder is not None else None,
|
708 |
+
lpips_folder_naming_index=current_lpips_naming_idx_for_folder,
|
709 |
+
is_halfbody_primary_target_type=item_data['is_halfbody_primary_target_type'],
|
710 |
+
is_derived_head_crop=item_data['is_derived_head_crop'],
|
711 |
+
is_derived_face_crop=item_data['is_derived_face_crop']
|
712 |
+
)
|
713 |
+
try:
|
714 |
+
images_to_zip[final_filename] = image_to_bytes(item_data['pil_image'])
|
715 |
+
except Exception as e_bytes:
|
716 |
+
print(f" Error converting/adding {final_filename} to zip: {e_bytes}")
|
717 |
+
finally:
|
718 |
+
if 'pil_image' in item_data and item_data['pil_image'] is not None:
|
719 |
+
del item_data['pil_image']
|
720 |
+
images_pending_final_processing.clear()
|
721 |
+
|
722 |
+
if not images_to_zip:
|
723 |
+
status_message = f"Processing for {source_file_prefix} finished, but no images were converted for zipping."
|
724 |
+
print(status_message)
|
725 |
+
return None, status_message
|
726 |
+
|
727 |
+
print(f"Preparing zip file for {source_file_prefix} with {len(images_to_zip)} images...")
|
728 |
+
progress_updater(1.0, desc=f"Creating Zip File for {source_file_prefix}...")
|
729 |
+
zip_start_time = time.time()
|
730 |
+
|
731 |
+
# Use NamedTemporaryFile with delete=False for the final output path
|
732 |
+
# This file will persist until manually cleaned or OS cleanup
|
733 |
+
temp_zip_file = tempfile.NamedTemporaryFile(delete=False, suffix=".zip")
|
734 |
+
output_zip_path_temp = temp_zip_file.name
|
735 |
+
temp_zip_file.close() # Close the handle, but file remains
|
736 |
+
|
737 |
+
try:
|
738 |
+
# Write data to the temporary file path
|
739 |
+
create_zip_file(images_to_zip, output_zip_path_temp)
|
740 |
+
zip_duration = time.time() - zip_start_time
|
741 |
+
print(f"Temporary zip file for {source_file_prefix} created in {zip_duration:.2f} seconds at {output_zip_path_temp}")
|
742 |
+
|
743 |
+
# Construct the new, desired filename
|
744 |
+
temp_dir = os.path.dirname(output_zip_path_temp)
|
745 |
+
timestamp = int(time.time())
|
746 |
+
desired_filename = f"{source_file_prefix}_processed_{timestamp}.zip"
|
747 |
+
output_zip_path_final = os.path.join(temp_dir, desired_filename)
|
748 |
+
|
749 |
+
# Rename the temporary file to the desired name
|
750 |
+
print(f"Renaming temp file for {source_file_prefix} to: {output_zip_path_final}")
|
751 |
+
os.rename(output_zip_path_temp, output_zip_path_final)
|
752 |
+
print("Rename successful.")
|
753 |
+
output_zip_path_temp = None # Clear temp path as it's been renamed
|
754 |
+
|
755 |
+
except Exception as zip_or_rename_err:
|
756 |
+
print(f"Error during zip creation or renaming for {source_file_prefix}: {zip_or_rename_err}")
|
757 |
+
# Clean up the *original* temp file if it still exists and renaming failed
|
758 |
+
if output_zip_path_temp and os.path.exists(output_zip_path_temp):
|
759 |
+
try:
|
760 |
+
os.remove(output_zip_path_temp)
|
761 |
+
except OSError:
|
762 |
+
pass
|
763 |
+
if output_zip_path_final and os.path.exists(output_zip_path_final): # Check if rename partially happened
|
764 |
+
try:
|
765 |
+
os.remove(output_zip_path_final)
|
766 |
+
except OSError:
|
767 |
+
pass
|
768 |
+
raise zip_or_rename_err # Re-raise the error
|
769 |
+
|
770 |
+
# --- Prepare Status Message ---
|
771 |
+
processing_duration = time.time() - start_time - zip_duration # Exclude zipping time from processing time
|
772 |
+
total_duration = time.time() - start_time # Includes zipping/renaming
|
773 |
+
|
774 |
+
# --- Build final status message ---
|
775 |
+
person_stats = "N/A"
|
776 |
+
if enable_person_detection:
|
777 |
+
person_stats = f"{total_persons_detected_raw} raw, {person_targets_processed_count} targets (>{min_target_width_person_percentage*100:.1f}% itemW)"
|
778 |
+
|
779 |
+
halfbody_stats = "N/A"
|
780 |
+
if enable_halfbody_detection:
|
781 |
+
halfbody_stats = f"{total_halfbodies_detected_raw} raw, {halfbody_targets_processed_count} targets (>{min_target_width_halfbody_percentage*100:.1f}% itemW)"
|
782 |
+
fullframe_stats = f"{fullframe_targets_processed_count} targets"
|
783 |
+
|
784 |
+
face_stats = "N/A"
|
785 |
+
if enable_face_detection:
|
786 |
+
face_stats = f"{total_faces_detected_on_targets} on targets, {face_crops_pending_count} crops pending (>{min_crop_width_face_percentage*100:.1f}% parentW)"
|
787 |
+
if enable_face_filtering:
|
788 |
+
face_stats += f", {items_filtered_by_face_count} targets filtered"
|
789 |
+
|
790 |
+
head_stats = "N/A"
|
791 |
+
if enable_head_detection:
|
792 |
+
head_stats = f"{total_heads_detected_on_targets} on targets, {head_crops_pending_count} crops pending (>{min_crop_width_head_percentage*100:.1f}% parentW)"
|
793 |
+
if enable_head_filtering:
|
794 |
+
head_stats += f", {items_filtered_by_head_count} targets filtered"
|
795 |
+
|
796 |
+
ccip_stats = "N/A"
|
797 |
+
if enable_ccip_classification:
|
798 |
+
ccip_stats = f"{next_ccip_cluster_id} original clusters created, on {ccip_applied_count} targets. Folders renamed by image count."
|
799 |
+
|
800 |
+
lpips_stats = "N/A"
|
801 |
+
if enable_lpips_clustering:
|
802 |
+
lpips_stats = f"{lpips_images_subject_to_clustering} images processed, {total_lpips_clusters_created} clusters, {total_lpips_noise_samples} noise. Folders renamed by image count."
|
803 |
+
|
804 |
+
aesthetic_stats = "N/A"
|
805 |
+
if enable_aesthetic_analysis:
|
806 |
+
aesthetic_stats = f"On {aesthetic_applied_count} targets"
|
807 |
+
|
808 |
+
item_desc_for_stats = "Raw Frames in Video" if is_video_source else "Items from Provider"
|
809 |
+
status_message = (
|
810 |
+
f"Processing for '{source_file_prefix}' Complete!\n"
|
811 |
+
f"Total time: {total_duration:.2f}s (Proc: {processing_duration:.2f}s, Zip: {zip_duration:.2f}s)\n"
|
812 |
+
f"{item_desc_for_stats}: {total_items_for_desc}, Processed Items: {processed_items_count}\n"
|
813 |
+
f"--- Primary Targets Processed ---\n"
|
814 |
+
f" Person Detection: {person_stats}\n"
|
815 |
+
f" Half-Body Detection: {halfbody_stats}\n"
|
816 |
+
f" Full Item Processing: {fullframe_stats}\n"
|
817 |
+
f"--- Items Pending Final Processing ({main_targets_pending_count} main, {face_crops_pending_count} face, {head_crops_pending_count} head) ---\n"
|
818 |
+
f" Face Detection: {face_stats}\n"
|
819 |
+
f" Head Detection: {head_stats}\n"
|
820 |
+
f" CCIP Classification: {ccip_stats}\n"
|
821 |
+
f" LPIPS Clustering: {lpips_stats}\n"
|
822 |
+
f" Aesthetic Analysis: {aesthetic_stats}\n"
|
823 |
+
f"Zip file contains {len(images_to_zip)} images.\n"
|
824 |
+
f"Output Zip: {output_zip_path_final}"
|
825 |
+
)
|
826 |
+
print(status_message)
|
827 |
+
progress_updater(1.0, desc=f"Finished {source_file_prefix}!")
|
828 |
+
|
829 |
+
# Return the path to the zip file
|
830 |
+
return output_zip_path_final, status_message
|
831 |
+
|
832 |
+
except Exception as e:
|
833 |
+
print(f"!! An unhandled error occurred during processing of {source_file_prefix}: {e}")
|
834 |
+
traceback.print_exc() # Print detailed traceback for debugging
|
835 |
+
# Clean up main data structures
|
836 |
+
images_pending_final_processing.clear()
|
837 |
+
ccip_clusters_info.clear()
|
838 |
+
gc.collect()
|
839 |
+
|
840 |
+
# Clean up temp file if it exists on general error
|
841 |
+
if output_zip_path_temp and os.path.exists(output_zip_path_temp):
|
842 |
+
try:
|
843 |
+
os.remove(output_zip_path_temp)
|
844 |
+
except OSError:
|
845 |
+
pass
|
846 |
+
|
847 |
+
# Clean up final file if it exists on general error (maybe renaming succeeded but later code failed)
|
848 |
+
if output_zip_path_final and os.path.exists(output_zip_path_final):
|
849 |
+
try:
|
850 |
+
os.remove(output_zip_path_final)
|
851 |
+
except OSError:
|
852 |
+
pass
|
853 |
+
return None, f"An error occurred with {source_file_prefix}: {e}"
|
854 |
+
|
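# Note on the two callable contracts consumed above (a minimal sketch, not app code;
# the helper name below is purely illustrative): frames_provider is any iterator of
# (PIL.Image, identifier, 1-based item index, total item count), and progress_updater
# is any callable accepting (value: float, desc: str). For example:
#
#   def demo_frames_provider(paths):
#       total = len(paths)
#       for idx, path in enumerate(paths):
#           yield Image.open(path).convert('RGB'), idx, idx + 1, total
#
# and a no-op updater is simply: lambda value, desc="": None.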
855 |
+
# --- Main Processing Function for Input files ---
|
856 |
+
def process_inputs_main(
|
857 |
+
input_file_objects: List[Any], # Gradio File component gives list of tempfile._TemporaryFileWrapper
|
858 |
+
sample_interval_ms: int, # Relevant for videos only
|
859 |
+
# Person Detection
|
860 |
+
enable_person_detection: bool,
|
861 |
+
min_target_width_person_percentage: float,
|
862 |
+
person_model_name: str,
|
863 |
+
person_conf_threshold: float,
|
864 |
+
person_iou_threshold: float,
|
865 |
+
# Half-Body Detection
|
866 |
+
enable_halfbody_detection: bool,
|
867 |
+
enable_halfbody_cropping: bool,
|
868 |
+
min_target_width_halfbody_percentage: float,
|
869 |
+
halfbody_model_name: str,
|
870 |
+
halfbody_conf_threshold: float,
|
871 |
+
halfbody_iou_threshold: float,
|
872 |
+
# Head Detection
|
873 |
+
enable_head_detection: bool,
|
874 |
+
enable_head_cropping: bool,
|
875 |
+
min_crop_width_head_percentage: float,
|
876 |
+
enable_head_filtering: bool,
|
877 |
+
head_model_name: str,
|
878 |
+
head_conf_threshold: float,
|
879 |
+
head_iou_threshold: float,
|
880 |
+
# Face Detection
|
881 |
+
enable_face_detection: bool,
|
882 |
+
enable_face_cropping: bool,
|
883 |
+
min_crop_width_face_percentage: float,
|
884 |
+
enable_face_filtering: bool,
|
885 |
+
face_model_name: str,
|
886 |
+
face_conf_threshold: float,
|
887 |
+
face_iou_threshold: float,
|
888 |
+
# CCIP Classification
|
889 |
+
enable_ccip_classification: bool,
|
890 |
+
ccip_model_name: str,
|
891 |
+
ccip_threshold: float,
|
892 |
+
# LPIPS Clustering
|
893 |
+
enable_lpips_clustering: bool,
|
894 |
+
lpips_threshold: float,
|
895 |
+
# Aesthetic Analysis
|
896 |
+
enable_aesthetic_analysis: bool,
|
897 |
+
aesthetic_model_name: str,
|
898 |
+
progress=gr.Progress(track_tqdm=True) # Gradio progress for overall processing
|
899 |
+
) -> Tuple[Optional[List[str]], str]: # Returns list of ZIP paths and combined status
|
900 |
+
|
901 |
+
if not input_file_objects:
|
902 |
+
return [], "Error: No files provided."
|
903 |
+
|
904 |
+
video_file_temp_objects: List[Any] = []
|
905 |
+
image_file_temp_objects: List[Any] = []
|
906 |
+
|
907 |
+
for file_obj in input_file_objects:
|
908 |
+
# gr.Files returns a list of tempfile._TemporaryFileWrapper objects
|
909 |
+
# We need the .name attribute to get the actual file path
|
910 |
+
file_name = getattr(file_obj, 'orig_name', file_obj.name) # Use original name if available
|
911 |
+
if isinstance(file_name, str):
|
912 |
+
lower_file_name = file_name.lower()
|
913 |
+
if any(lower_file_name.endswith(ext) for ext in VIDEO_EXTENSIONS):
|
914 |
+
video_file_temp_objects.append(file_obj)
|
915 |
+
elif any(lower_file_name.endswith(ext) for ext in IMAGE_EXTENSIONS):
|
916 |
+
image_file_temp_objects.append(file_obj)
|
917 |
+
else:
|
918 |
+
print(f"Warning: File '{file_name}' has an unrecognized extension and will be skipped.")
|
919 |
+
else:
|
920 |
+
print(f"Warning: File object {file_obj} does not have a valid name and will be skipped.")
|
921 |
+
|
922 |
+
|
923 |
+
output_zip_paths_all_sources = []
|
924 |
+
all_status_messages = []
|
925 |
+
|
926 |
+
total_processing_tasks = (1 if image_file_temp_objects else 0) + len(video_file_temp_objects)
|
927 |
+
if total_processing_tasks == 0:
|
928 |
+
return [], "No processable video or image files found in the input."
|
929 |
+
|
930 |
+
tasks_completed_count = 0
|
931 |
+
|
932 |
+
# Print overall settings once
|
933 |
+
print(f"--- Overall Batch Processing Settings ---")
|
934 |
+
print(f" Number of image sequences to process: {1 if image_file_temp_objects else 0}")
|
935 |
+
print(f" Number of videos to process: {len(video_file_temp_objects)}")
|
936 |
+
print(f" Sample Interval (for videos): {sample_interval_ms}ms")
|
937 |
+
print(f" Detection Order: Person => Half-Body (alt) => Face => Head. Then: CCIP => LPIPS => Aesthetic.")
|
938 |
+
print(f" Person Detect = {enable_person_detection}" + (f" (MinW:{min_target_width_person_percentage*100:.1f}%, Mdl:{person_model_name}, Conf:{person_conf_threshold:.2f}, IoU:{person_iou_threshold:.2f})" if enable_person_detection else ""))
|
939 |
+
print(f" HalfBody Detect = {enable_halfbody_detection}" + (f" (FullFrameOnly, Crop:{enable_halfbody_cropping}, MinW:{min_target_width_halfbody_percentage*100:.1f}%, Mdl:{halfbody_model_name}, Conf:{halfbody_conf_threshold:.2f}, IoU:{halfbody_iou_threshold:.2f})" if enable_halfbody_detection else ""))
|
940 |
+
print(f" Face Detect = {enable_face_detection}" + (f" (Crop:{enable_face_cropping}, MinW:{min_crop_width_face_percentage*100:.1f}%, Filter:{enable_face_filtering}, Mdl:{face_model_name}, Conf:{face_conf_threshold:.2f}, IoU:{face_iou_threshold:.2f})" if enable_face_detection else ""))
|
941 |
+
print(f" Head Detect = {enable_head_detection}" + (f" (Crop:{enable_head_cropping}, MinW:{min_crop_width_head_percentage*100:.1f}%, Filter:{enable_head_filtering}, Mdl:{head_model_name}, Conf:{head_conf_threshold:.2f}, IoU:{head_iou_threshold:.2f})" if enable_head_detection else ""))
|
942 |
+
print(f" CCIP Classify = {enable_ccip_classification}" + (f" (Mdl:{ccip_model_name}, Thr:{ccip_threshold:.3f})" if enable_ccip_classification else ""))
|
943 |
+
print(f" LPIPS Clustering = {enable_lpips_clustering}" + (f" (Thr:{lpips_threshold:.3f})" if enable_lpips_clustering else ""))
|
944 |
+
print(f" Aesthetic Analyze = {enable_aesthetic_analysis}" + (f" (Mdl:{aesthetic_model_name})" if enable_aesthetic_analysis else ""))
|
945 |
+
print(f"--- End of Overall Settings ---")
|
946 |
+
|
947 |
+
|
948 |
+
# --- Process Image Sequence (if any) ---
|
949 |
+
if image_file_temp_objects:
|
950 |
+
image_group_label_base = "ImageGroup"
|
951 |
+
# Attempt to use first image name for more uniqueness, fallback to timestamp
|
952 |
+
try:
|
953 |
+
first_image_orig_name = getattr(image_file_temp_objects[0], 'orig_name', image_file_temp_objects[0].name)
|
954 |
+
image_group_label_base = sanitize_filename(first_image_orig_name, max_len=20)
|
955 |
+
except Exception:
|
956 |
+
pass # Stick with "ImageGroup"
|
957 |
+
|
958 |
+
image_source_file_prefix = f"{image_group_label_base}_{int(time.time())}"
|
959 |
+
|
960 |
+
current_task_number = tasks_completed_count + 1
|
961 |
+
progress_description_prefix = f"Image Seq. {current_task_number}/{total_processing_tasks} ({image_source_file_prefix})"
|
962 |
+
progress(tasks_completed_count / total_processing_tasks, desc=f"{progress_description_prefix}: Starting...")
|
963 |
+
print(f"\n>>> Processing Image Sequence: {image_source_file_prefix} ({len(image_file_temp_objects)} images) <<<")
|
964 |
+
|
965 |
+
def image_frames_provider_generator() -> Iterator[Tuple[Image.Image, int, int, int]]:
|
966 |
+
num_images = len(image_file_temp_objects)
|
967 |
+
for idx, img_obj in enumerate(image_file_temp_objects):
|
968 |
+
try:
|
969 |
+
pil_img = Image.open(img_obj.name).convert('RGB')
|
970 |
+
yield pil_img, idx, idx + 1, num_images
|
971 |
+
except Exception as e_load:
|
972 |
+
print(f"Error loading image {getattr(img_obj, 'orig_name', img_obj.name)}: {e_load}. Skipping.")
|
973 |
+
# If we skip, the num_images total reported to _process_input_source_frames will be slightly too high
|
974 |
+
# For simplicity, we'll proceed, but this could be refined to adjust total_items dynamically.
|
975 |
+
# Or, pre-filter loadable images. For now, just skip.
|
976 |
+
continue
|
977 |
+
|
978 |
+
def image_group_progress_updater(item_progress_value: float, desc: str):
|
979 |
+
overall_progress = (tasks_completed_count + item_progress_value) / total_processing_tasks
|
980 |
+
progress(overall_progress, desc=f"{progress_description_prefix}: {desc}")
|
981 |
+
|
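# Example of the overall-progress mapping above (hypothetical values): with 3 total
# tasks and 1 already completed, an item progress of 0.5 is reported to the shared
# Gradio bar as (1 + 0.5) / 3 = 0.5.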
982 |
+
try:
|
983 |
+
zip_file_path_single, status_message_single = _process_input_source_frames(
|
984 |
+
source_file_prefix=image_source_file_prefix,
|
985 |
+
frames_provider=image_frames_provider_generator(),
|
986 |
+
is_video_source=False,
|
987 |
+
enable_person_detection=enable_person_detection,
|
988 |
+
min_target_width_person_percentage=min_target_width_person_percentage,
|
989 |
+
person_model_name=person_model_name,
|
990 |
+
person_conf_threshold=person_conf_threshold,
|
991 |
+
person_iou_threshold=person_iou_threshold,
|
992 |
+
enable_halfbody_detection=enable_halfbody_detection,
|
993 |
+
enable_halfbody_cropping=enable_halfbody_cropping,
|
994 |
+
min_target_width_halfbody_percentage=min_target_width_halfbody_percentage,
|
995 |
+
halfbody_model_name=halfbody_model_name,
|
996 |
+
halfbody_conf_threshold=halfbody_conf_threshold,
|
997 |
+
halfbody_iou_threshold=halfbody_iou_threshold,
|
998 |
+
enable_head_detection=enable_head_detection,
|
999 |
+
enable_head_cropping=enable_head_cropping,
|
1000 |
+
min_crop_width_head_percentage=min_crop_width_head_percentage,
|
1001 |
+
enable_head_filtering=enable_head_filtering,
|
1002 |
+
head_model_name=head_model_name,
|
1003 |
+
head_conf_threshold=head_conf_threshold,
|
1004 |
+
head_iou_threshold=head_iou_threshold,
|
1005 |
+
enable_face_detection=enable_face_detection,
|
1006 |
+
enable_face_cropping=enable_face_cropping,
|
1007 |
+
min_crop_width_face_percentage=min_crop_width_face_percentage,
|
1008 |
+
enable_face_filtering=enable_face_filtering,
|
1009 |
+
face_model_name=face_model_name,
|
1010 |
+
face_conf_threshold=face_conf_threshold,
|
1011 |
+
face_iou_threshold=face_iou_threshold,
|
1012 |
+
enable_ccip_classification=enable_ccip_classification,
|
1013 |
+
ccip_model_name=ccip_model_name,
|
1014 |
+
ccip_threshold=ccip_threshold,
|
1015 |
+
enable_lpips_clustering=enable_lpips_clustering,
|
1016 |
+
lpips_threshold=lpips_threshold,
|
1017 |
+
enable_aesthetic_analysis=enable_aesthetic_analysis,
|
1018 |
+
aesthetic_model_name=aesthetic_model_name,
|
1019 |
+
progress_updater=image_group_progress_updater
|
1020 |
+
)
|
1021 |
+
if zip_file_path_single:
|
1022 |
+
output_zip_paths_all_sources.append(zip_file_path_single)
|
1023 |
+
all_status_messages.append(f"--- Image Sequence ({image_source_file_prefix}) Processing Succeeded ---\n{status_message_single}")
|
1024 |
+
else:
|
1025 |
+
all_status_messages.append(f"--- Image Sequence ({image_source_file_prefix}) Processing Failed ---\n{status_message_single}")
|
1026 |
+
except Exception as e_img_seq:
|
1027 |
+
error_msg = f"Critical error during processing of image sequence {image_source_file_prefix}: {e_img_seq}"
|
1028 |
+
print(error_msg)
|
1029 |
+
traceback.print_exc()
|
1030 |
+
all_status_messages.append(f"--- Image Sequence ({image_source_file_prefix}) Processing CRITICALLY FAILED ---\n{error_msg}")
|
1031 |
+
|
1032 |
+
tasks_completed_count += 1
|
1033 |
+
print(f">>> Finished attempt for Image Sequence: {image_source_file_prefix} <<<")
|
1034 |
+
|
1035 |
+
# --- Process Video Files (if any) ---
|
1036 |
+
for video_idx, video_file_temp_obj in enumerate(video_file_temp_objects):
|
1037 |
+
video_path_temp = video_file_temp_obj.name
|
1038 |
+
video_original_filename = os.path.basename(getattr(video_file_temp_obj, 'orig_name', video_path_temp))
|
1039 |
+
video_source_file_prefix = sanitize_filename(video_original_filename)
|
1040 |
+
|
1041 |
+
current_task_number = tasks_completed_count + 1
|
1042 |
+
progress_description_prefix = f"Video {current_task_number}/{total_processing_tasks}"
|
1043 |
+
|
1044 |
+
print(f"\n>>> Processing Video: {video_original_filename} (Sanitized Prefix: {video_source_file_prefix}) <<<")
|
1045 |
+
progress(tasks_completed_count / total_processing_tasks, desc=f"{progress_description_prefix}: Starting processing...")
|
1046 |
+
|
1047 |
+
# It yields: (PIL.Image, frame position in ms as an int identifier, 1-based raw frame index, total_items_for_desc)
|
1048 |
+
# The third element will be the raw frame number based on CAP_PROP_POS_FRAMES or current_pos_ms
|
1049 |
+
# to align progress with total_items_for_desc (raw frame count).
|
1050 |
+
def video_frames_provider_generator(video_path: str, interval_ms: int) -> Iterator[Tuple[Image.Image, int, int, int]]:
|
1051 |
+
cap = cv2.VideoCapture(video_path)
|
1052 |
+
if not cap.isOpened():
|
1053 |
+
print(f"Error: Could not open video file for provider: {video_path}")
|
1054 |
+
return
|
1055 |
+
|
1056 |
+
total_items_for_desc = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
|
1057 |
+
|
1058 |
+
if total_items_for_desc <= 0:
|
1059 |
+
print(f"Warning: Video {video_original_filename} reported {total_items_for_desc} frames. This might be inaccurate. Proceeding...")
|
1060 |
+
# If it's 0, the progress in _process_input_source_frames might behave unexpectedly.
|
1061 |
+
# Setting to 1 to avoid division by zero, but this means progress won't be very useful.
|
1062 |
+
total_items_for_desc = 1 # Fallback to prevent division by zero
|
1063 |
+
|
1064 |
+
# processed_count_in_provider = 0 # Counts *sampled* frames, not used for progress index
|
1065 |
+
last_processed_ms = -float('inf')
|
1066 |
+
raw_frames_read_by_provider = 0 # Counts all frames read by cap.read()
|
1067 |
+
|
1068 |
+
try:
|
1069 |
+
while True:
|
1070 |
+
# For progress, use current_pos_ms or CAP_PROP_POS_FRAMES
|
1071 |
+
# CAP_PROP_POS_FRAMES is a 0-based index of the next frame to be decoded/captured.
|
1072 |
+
current_raw_frame_index = int(cap.get(cv2.CAP_PROP_POS_FRAMES)) # Use this for progress
|
1073 |
+
current_pos_ms_in_provider = cap.get(cv2.CAP_PROP_POS_MSEC)
|
1074 |
+
|
1075 |
+
# Loop break condition (more robust)
|
1076 |
+
if raw_frames_read_by_provider > 0 and current_pos_ms_in_provider <= last_processed_ms and interval_ms > 0:
|
1077 |
+
# If interval_ms is 0 or very small, current_pos_ms might not advance much for consecutive reads.
|
1078 |
+
# Adding a check for raw_frames_read_by_provider against a large number or CAP_PROP_FRAME_COUNT
|
1079 |
+
# could be an additional safety, but CAP_PROP_FRAME_COUNT can be unreliable.
|
1080 |
+
# The ret_frame check is the primary exit.
|
1081 |
+
pass # Let ret_frame handle the actual end. This check is for stuck videos.
|
1082 |
+
|
1083 |
+
|
1084 |
+
should_process_this_frame = current_pos_ms_in_provider >= last_processed_ms + interval_ms - 1
|
1085 |
+
|
1086 |
+
ret_frame, frame_cv_data = cap.read()
|
1087 |
+
if not ret_frame: # Primary exit point for the loop
|
1088 |
+
break
|
1089 |
+
raw_frames_read_by_provider +=1 # Incremented after successful read
|
1090 |
+
|
1091 |
+
if should_process_this_frame:
|
1092 |
+
try:
|
1093 |
+
pil_img = convert_to_pil(frame_cv_data)
|
1094 |
+
last_processed_ms = current_pos_ms_in_provider
|
1095 |
+
yield pil_img, int(current_pos_ms_in_provider), current_raw_frame_index + 1, total_items_for_desc # Yield 1-based raw frame index
|
1096 |
+
except Exception as e_conv:
|
1097 |
+
print(f"Error converting frame at {current_pos_ms_in_provider}ms (raw index {current_raw_frame_index}) for {video_original_filename}: {e_conv}. Skipping.")
|
1098 |
+
finally:
|
1099 |
+
pass
|
1100 |
+
finally:
|
1101 |
+
if cap.isOpened():
|
1102 |
+
cap.release()
|
1103 |
+
print(f" Video capture for provider ({video_original_filename}) released.")
|
1104 |
+
|
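# Sampling note (illustrative numbers): with sample_interval_ms = 1000 the provider
# above emits roughly one frame per second of video, since a frame is only converted
# once CAP_PROP_POS_MSEC has advanced to at least last_processed_ms + interval_ms - 1.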
1105 |
+
def video_progress_updater(item_progress_value: float, desc: str):
|
1106 |
+
overall_progress = (tasks_completed_count + item_progress_value) / total_processing_tasks
|
1107 |
+
            progress(overall_progress, desc=f"{progress_description_prefix}: {desc}")

        try:
            zip_file_path_single, status_message_single = _process_input_source_frames(
                source_file_prefix=video_source_file_prefix,
                frames_provider=video_frames_provider_generator(video_path_temp, sample_interval_ms),
                is_video_source=True,
                enable_person_detection=enable_person_detection,
                min_target_width_person_percentage=min_target_width_person_percentage,
                person_model_name=person_model_name,
                person_conf_threshold=person_conf_threshold,
                person_iou_threshold=person_iou_threshold,
                enable_halfbody_detection=enable_halfbody_detection,
                enable_halfbody_cropping=enable_halfbody_cropping,
                min_target_width_halfbody_percentage=min_target_width_halfbody_percentage,
                halfbody_model_name=halfbody_model_name,
                halfbody_conf_threshold=halfbody_conf_threshold,
                halfbody_iou_threshold=halfbody_iou_threshold,
                enable_head_detection=enable_head_detection,
                enable_head_cropping=enable_head_cropping,
                min_crop_width_head_percentage=min_crop_width_head_percentage,
                enable_head_filtering=enable_head_filtering,
                head_model_name=head_model_name,
                head_conf_threshold=head_conf_threshold,
                head_iou_threshold=head_iou_threshold,
                enable_face_detection=enable_face_detection,
                enable_face_cropping=enable_face_cropping,
                min_crop_width_face_percentage=min_crop_width_face_percentage,
                enable_face_filtering=enable_face_filtering,
                face_model_name=face_model_name,
                face_conf_threshold=face_conf_threshold,
                face_iou_threshold=face_iou_threshold,
                enable_ccip_classification=enable_ccip_classification,
                ccip_model_name=ccip_model_name,
                ccip_threshold=ccip_threshold,
                enable_lpips_clustering=enable_lpips_clustering,
                lpips_threshold=lpips_threshold,
                enable_aesthetic_analysis=enable_aesthetic_analysis,
                aesthetic_model_name=aesthetic_model_name,
                progress_updater=video_progress_updater
            )
            if zip_file_path_single:
                output_zip_paths_all_sources.append(zip_file_path_single)
                all_status_messages.append(f"--- Video ({video_original_filename}) Processing Succeeded ---\n{status_message_single}")
            else:
                all_status_messages.append(f"--- Video ({video_original_filename}) Processing Failed ---\n{status_message_single}")

        except Exception as e_vid:
            # Catches errors if _process_input_source_frames itself raises an unhandled exception
            # (it also has its own internal try-except)
            error_msg = f"Critical error during processing of video {video_original_filename}: {e_vid}"
            print(error_msg)
            traceback.print_exc()
            all_status_messages.append(f"--- Video ({video_original_filename}) Processing CRITICALLY FAILED ---\n{error_msg}")

        tasks_completed_count += 1
        print(f">>> Finished attempt for Video: {video_original_filename} <<<")
        # Gradio manages the lifecycle of video_path_temp (the uploaded temp file)

    final_summary_message = "\n\n==============================\n\n".join(all_status_messages)

    successful_zips_count = len(output_zip_paths_all_sources)
    if successful_zips_count == 0 and total_processing_tasks > 0:
        final_summary_message = f"ALL {total_processing_tasks} INPUT SOURCE(S) FAILED TO PRODUCE A ZIP FILE.\n\n" + final_summary_message
    elif total_processing_tasks > 0:
        final_summary_message = f"Successfully processed {successful_zips_count} out of {total_processing_tasks} input source(s).\n\n" + final_summary_message
    else:  # Should be caught earlier by "No processable files"
        final_summary_message = "No inputs were processed."

    progress(1.0, desc="All processing attempts finished.")

    # gr.Files output expects a list of file paths. An empty list is fine if no files.
    return output_zip_paths_all_sources, final_summary_message

# --- Gradio Interface Setup ---

css = """
/* Default (Light Mode) Styles */
#warning {
    background-color: #FFCCCB; /* Light red background */
    padding: 10px;
    border-radius: 5px;
    color: #A00000; /* Dark red text */
    border: 1px solid #E5B8B7; /* A slightly darker border for more definition */
}
/* Dark Mode Styles */
@media (prefers-color-scheme: dark) {
    #warning {
        background-color: #5C1A1A; /* Darker red background, suitable for dark mode */
        color: #FFDDDD; /* Light pink text, for good contrast against the dark red background */
        border: 1px solid #8B0000; /* A more prominent dark red border in dark mode */
    }
}
#status_box {
    white-space: pre-wrap !important; /* Ensure status messages show newlines */
    font-family: monospace; /* Optional: Use monospace for better alignment */
}
"""

# --- Define Model Lists ---
person_models = ['person_detect_v1.3_s', 'person_detect_v1.2_s', 'person_detect_v1.1_s', 'person_detect_v1.1_m', 'person_detect_v1_m', 'person_detect_v1.1_n', 'person_detect_v0_s', 'person_detect_v0_m', 'person_detect_v0_x']
halfbody_models = ['halfbody_detect_v1.0_s', 'halfbody_detect_v1.0_n', 'halfbody_detect_v0.4_s', 'halfbody_detect_v0.3_s', 'halfbody_detect_v0.2_s']
head_models = ['head_detect_v2.0_s', 'head_detect_v2.0_m', 'head_detect_v2.0_n', 'head_detect_v2.0_x', 'head_detect_v2.0_s_yv11', 'head_detect_v2.0_m_yv11', 'head_detect_v2.0_n_yv11', 'head_detect_v2.0_x_yv11', 'head_detect_v2.0_l_yv11']
face_models = ['face_detect_v1.4_s', 'face_detect_v1.4_n', 'face_detect_v1.3_s', 'face_detect_v1.3_n', 'face_detect_v1.2_s', 'face_detect_v1.1_s', 'face_detect_v1.1_n', 'face_detect_v1_s', 'face_detect_v1_n', 'face_detect_v0_s', 'face_detect_v0_n']
ccip_models = ['ccip-caformer-24-randaug-pruned', 'ccip-caformer-6-randaug-pruned_fp32', 'ccip-caformer-5_fp32']
aesthetic_models = ['swinv2pv3_v0_448_ls0.2_x', 'swinv2pv3_v0_448_ls0.2', 'caformer_s36_v0_ls0.2']

with gr.Blocks(css=css) as demo:
    gr.Markdown("# Video Processor using dghs-imgutils")
    gr.Markdown("Upload one or more videos, or a sequence of images. Videos are processed individually, while multiple images are treated as a single sequence. Each processed source (video or image sequence) is then sequentially analyzed by [dghs-imgutils](https://github.com/deepghs/imgutils) to detect subjects, classify items, and process its content according to your settings, ultimately generating a ZIP file with the extracted images.")
    gr.Markdown("**Detection Flow:** " +
                "[Person](https://dghs-imgutils.deepghs.org/main/api_doc/detect/person.html) ⇒ " +
                "[Half-Body](https://dghs-imgutils.deepghs.org/main/api_doc/detect/halfbody.html) (if no person) ⇒ " +
                "[Face](https://dghs-imgutils.deepghs.org/main/api_doc/detect/face.html) (on target) ⇒ " +
                "[Head](https://dghs-imgutils.deepghs.org/main/api_doc/detect/head.html) (on target).")
    gr.Markdown("**Analysis Flow:** " +
                "[CCIP](https://dghs-imgutils.deepghs.org/main/api_doc/metrics/ccip.html) Clustering ⇒ " +
                "[LPIPS](https://dghs-imgutils.deepghs.org/main/api_doc/metrics/lpips.html) Clustering ⇒ " +
                "[Aesthetic](https://dghs-imgutils.deepghs.org/main/api_doc/metrics/dbaesthetic.html) Labeling.")
    gr.Markdown("**Note on CCIP Folders:** CCIP cluster folders are named `{source_prefix}_ccip_XXX`, sorted by image count (most images = `_ccip_000`).")
    gr.Markdown("**Note on LPIPS Folders:** LPIPS cluster folders (e.g., `lpips_XXX` or `lpips_sub_XXX`) are also sorted by image count within their scope. 'noise' folders are named explicitly.")

    with gr.Row():
        with gr.Column(scale=1):
            # --- Input Components ---
            process_button = gr.Button("Process Input(s) & Generate ZIP(s)", variant="primary")
            input_files = gr.Files(label="Upload Videos or Image Sequences", file_types=['video', 'image'], file_count="multiple")
            sample_interval_ms = gr.Number(label="Sample Interval (ms, for videos)", value=1000, minimum=1, step=100)

            # --- Detection Options ---
            gr.Markdown("**Detection Options**")
            # --- Person Detection Block ---
            with gr.Accordion("Person Detection Options", open=True):
                enable_person_detection = gr.Checkbox(label="Enable Person Detection", value=True)
                with gr.Group() as person_detection_params_group:
                    min_target_width_person_percentage_slider = gr.Slider(
                        minimum=0.0, maximum=1.0, value=0.25, step=0.01,
                        label="Min Target Width (% of Item Width)",
                        info="Minimum width for a detected person to be processed (e.g., 0.25 = 25%)."
                    )
                    person_model_name_dd = gr.Dropdown(person_models, label="PD Model", value=person_models[0])
                    person_conf_threshold = gr.Slider(0.0, 1.0, value=0.3, step=0.05, label="PD Conf")
                    person_iou_threshold = gr.Slider(0.0, 1.0, value=0.5, step=0.05, label="PD IoU")
                enable_person_detection.change(fn=lambda e: gr.update(visible=e), inputs=enable_person_detection, outputs=person_detection_params_group)

            # --- Half-Body Detection Block ---
            with gr.Accordion("Half-Body Detection Options", open=True):
                enable_halfbody_detection = gr.Checkbox(label="Enable Half-Body Detection", value=True)
                with gr.Group() as halfbody_params_group:
                    gr.Markdown("<small>_Detects half-bodies in full items if Person Detection is off/fails._</small>")
                    enable_halfbody_cropping = gr.Checkbox(label="Use Half-Bodies as Targets", value=True)
                    min_target_width_halfbody_percentage_slider = gr.Slider(
                        minimum=0.0, maximum=1.0, value=0.25, step=0.01,
                        label="Min Target Width (% of Item Width)",
                        info="Minimum width for a detected half-body to be processed (e.g., 0.25 = 25%)."
                    )
                    halfbody_model_name_dd = gr.Dropdown(halfbody_models, label="HBD Model", value=halfbody_models[0])
                    halfbody_conf_threshold = gr.Slider(0.0, 1.0, value=0.5, step=0.05, label="HBD Conf")
                    halfbody_iou_threshold = gr.Slider(0.0, 1.0, value=0.7, step=0.05, label="HBD IoU")
                enable_halfbody_detection.change(fn=lambda e: gr.update(visible=e), inputs=enable_halfbody_detection, outputs=halfbody_params_group)

            # --- Face Detection Block ---
            with gr.Accordion("Face Detection Options", open=True):
                enable_face_detection = gr.Checkbox(label="Enable Face Detection", value=True)
                with gr.Group() as face_params_group:
                    enable_face_filtering = gr.Checkbox(label="Filter Targets Without Detected Faces", value=True)
                    enable_face_cropping = gr.Checkbox(label="Crop Detected Faces", value=False)
                    min_crop_width_face_percentage_slider = gr.Slider(
                        minimum=0.0, maximum=1.0, value=0.2, step=0.01,
                        label="Min Crop Width (% of Parent Width)",
                        info="Minimum width for a face crop relative to its parent image's width (e.g., 0.2 = 20%)."
                    )
                    face_model_name_dd = gr.Dropdown(face_models, label="FD Model", value=face_models[0])
                    face_conf_threshold = gr.Slider(0.0, 1.0, value=0.25, step=0.05, label="FD Conf")
                    face_iou_threshold = gr.Slider(0.0, 1.0, value=0.7, step=0.05, label="FD IoU")
                enable_face_detection.change(fn=lambda e: gr.update(visible=e), inputs=enable_face_detection, outputs=face_params_group)

            # --- Head Detection Block ---
            with gr.Accordion("Head Detection Options", open=True):
                enable_head_detection = gr.Checkbox(label="Enable Head Detection", value=True)
                with gr.Group() as head_params_group:
                    gr.Markdown("<small>_Detects heads in targets. Crops if meets width req._</small>")
                    enable_head_filtering = gr.Checkbox(label="Filter Targets Without Heads", value=True)
                    enable_head_cropping = gr.Checkbox(label="Crop Detected Heads", value=False)
                    min_crop_width_head_percentage_slider = gr.Slider(
                        minimum=0.0, maximum=1.0, value=0.2, step=0.01,
                        label="Min Crop Width (% of Parent Width)",
                        info="Minimum width for a head crop relative to its parent image's width (e.g., 0.2 = 20%)."
                    )
                    head_model_name_dd = gr.Dropdown(head_models, label="HD Model", value=head_models[0])
                    head_conf_threshold = gr.Slider(0.0, 1.0, value=0.4, step=0.05, label="HD Conf")
                    head_iou_threshold = gr.Slider(0.0, 1.0, value=0.7, step=0.05, label="HD IoU")
                enable_head_detection.change(fn=lambda e: gr.update(visible=e), inputs=enable_head_detection, outputs=head_params_group)

            # --- Analysis/Classification Options ---
            gr.Markdown("**Analysis & Classification**")
            # --- CCIP Classification Block ---
            with gr.Accordion("CCIP Classification Options", open=True):
                enable_ccip_classification = gr.Checkbox(label="Enable CCIP Classification", value=True)
                with gr.Group() as ccip_params_group:
                    gr.Markdown("<small>_Clusters results by similarity. Folders sorted by image count._</small>")
                    ccip_model_name_dd = gr.Dropdown(ccip_models, label="CCIP Model", value=ccip_models[0])
                    ccip_threshold_slider = gr.Slider(0.0, 1.0, step=0.01, value=0.20, label="CCIP Similarity Threshold")
                enable_ccip_classification.change(fn=lambda e: gr.update(visible=e), inputs=enable_ccip_classification, outputs=ccip_params_group)

            # LPIPS Clustering Options
            with gr.Accordion("LPIPS Clustering Options", open=True):
                enable_lpips_clustering = gr.Checkbox(label="Enable LPIPS Clustering", value=True)
                with gr.Group() as lpips_params_group:
                    gr.Markdown("<small>_Clusters images by LPIPS similarity. Applied after CCIP (if enabled) or globally. Folders sorted by image count._</small>")
                    lpips_threshold_slider = gr.Slider(0.0, 1.0, step=0.01, value=0.45, label="LPIPS Similarity Threshold")
                enable_lpips_clustering.change(fn=lambda e: gr.update(visible=e), inputs=enable_lpips_clustering, outputs=lpips_params_group)

            # --- Aesthetic Analysis Block ---
            with gr.Accordion("Aesthetic Analysis Options", open=True):
                enable_aesthetic_analysis = gr.Checkbox(label="Enable Aesthetic Analysis (Anime)", value=True)
                with gr.Group() as aesthetic_params_group:
                    gr.Markdown("<small>_Prepends aesthetic label to filenames._</small>")
                    aesthetic_model_name_dd = gr.Dropdown(aesthetic_models, label="Aesthetic Model", value=aesthetic_models[0])
                enable_aesthetic_analysis.change(fn=lambda e: gr.update(visible=e), inputs=enable_aesthetic_analysis, outputs=aesthetic_params_group)

            gr.Markdown("---")
            gr.Markdown("**Warning:** Complex combinations can be slow. Models downloaded on first use.", elem_id="warning")

        with gr.Column(scale=1):
            # --- Output Components ---
            status_text = gr.Textbox(label="Processing Status", interactive=False, lines=20, elem_id="status_box")
            output_zips = gr.Files(label="Download Processed Images (ZIPs)")

    # Connect button click
    process_button.click(
        fn=process_inputs_main,
        inputs=[
            input_files, sample_interval_ms,
            # Person Detect
            enable_person_detection, min_target_width_person_percentage_slider,
            person_model_name_dd, person_conf_threshold, person_iou_threshold,
            # HalfBody Detect
            enable_halfbody_detection, enable_halfbody_cropping, min_target_width_halfbody_percentage_slider,
            halfbody_model_name_dd, halfbody_conf_threshold, halfbody_iou_threshold,
            # Head Detect
            enable_head_detection, enable_head_cropping, min_crop_width_head_percentage_slider,
            enable_head_filtering, head_model_name_dd, head_conf_threshold, head_iou_threshold,
            # Face Detect
            enable_face_detection, enable_face_cropping, min_crop_width_face_percentage_slider,
            enable_face_filtering, face_model_name_dd, face_conf_threshold, face_iou_threshold,
            # CCIP
            enable_ccip_classification, ccip_model_name_dd, ccip_threshold_slider,
            # LPIPS
            enable_lpips_clustering, lpips_threshold_slider,
            # Aesthetic
            enable_aesthetic_analysis, aesthetic_model_name_dd,
        ],
        outputs=[output_zips, status_text]
    )

# --- Launch Script ---
if __name__ == "__main__":
    print("Starting Gradio App...")
    # Model pre-check
    try:
        print("Checking/Downloading models (this might take a moment)...")
        # Use simple, small images for checks
        dummy_img_pil = Image.new('RGB', (64, 64), color='orange')
        print(" - Person detection...")
        _ = person_detector.detect_person(dummy_img_pil, model_name=person_models[0])
        print(" - HalfBody detection...")
        _ = halfbody_detector.detect_halfbody(dummy_img_pil, model_name=halfbody_models[0])
        print(" - Head detection...")
        _ = head_detector.detect_heads(dummy_img_pil, model_name=head_models[0])
        print(" - Face detection...")
        _ = face_detector.detect_faces(dummy_img_pil, model_name=face_models[0])
        print(" - CCIP feature extraction...")
        _ = ccip_analyzer.ccip_extract_feature(dummy_img_pil, size=384, model=ccip_models[0])
        print(" - LPIPS feature extraction...")
        _ = lpips_module.lpips_extract_feature(dummy_img_pil)
        print(" - Aesthetic analysis...")
        _ = dbaesthetic_analyzer.anime_dbaesthetic(dummy_img_pil, model_name=aesthetic_models[0])
        print("Models seem ready or downloaded.")
        del dummy_img_pil
        gc.collect()
    except Exception as model_err:
        print("\n--- !!! WARNING !!! ---")
        print(f"Could not pre-check/download all models: {model_err}")
        print("Models will be downloaded when first used by the application, which may cause a delay on the first run.")
        print("Check your internet connection and library installation (pip install \"dghs-imgutils[gpu]\").")
        print("-----------------------\n")
    # Launch the app
    demo.launch(inbrowser=True)
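The interface text above summarizes the detection flow as Person ⇒ Half-Body (if no person) ⇒ Face/Head on each target. As an editor-added illustration only (not the app's `_process_input_source_frames`), the following minimal sketch shows that fallback using the module-level `detect_person` / `detect_halfbody` helpers documented for dghs-imgutils; the import path, default thresholds, and the `(bbox, label, score)` result format are assumptions based on that documentation.

# Hypothetical sketch of the "Person => Half-Body (if no person)" target selection.
# `frame` stands in for one sampled video frame; not part of app.py.
from PIL import Image
from imgutils.detect import detect_person, detect_halfbody

def pick_targets(frame: Image.Image, min_width_pct: float = 0.25) -> list:
    """Crop person boxes if any are wide enough; otherwise fall back to half-body boxes."""
    min_width = frame.width * min_width_pct
    person_boxes = [box for box, _, _ in detect_person(frame)
                    if (box[2] - box[0]) >= min_width]
    if person_boxes:
        return [frame.crop(box) for box in person_boxes]
    halfbody_boxes = [box for box, _, _ in detect_halfbody(frame)
                      if (box[2] - box[0]) >= min_width]
    return [frame.crop(box) for box in halfbody_boxes]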
requirements.txt
ADDED
@@ -0,0 +1,2 @@
gradio==5.29.0
dghs-imgutils[gpu]
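As a quick, editor-added sanity check after installing these two pins (illustrative only; the `imgutils.detect` import path follows the dghs-imgutils documentation and is an assumption here), something like the following should print the Gradio version and trigger the first detection-model download:

# Illustrative install check; not part of the repository.
from PIL import Image
import gradio
from imgutils.detect import detect_person

print(gradio.__version__)                          # expected: 5.29.0
print(detect_person(Image.new('RGB', (64, 64))))   # downloads a model on first call; likely prints []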
webui.bat
ADDED
@@ -0,0 +1,73 @@
@echo off

:: The source of the webui.bat file is stable-diffusion-webui
:: set COMMANDLINE_ARGS=--whisper_implementation faster-whisper --input_audio_max_duration -1 --default_model_name large-v2 --auto_parallel True --output_dir output --vad_max_merge_size 90 --save_downloaded_files --autolaunch

if not defined PYTHON (set PYTHON=python)
if not defined VENV_DIR (set "VENV_DIR=%~dp0%venv")

mkdir tmp 2>NUL

%PYTHON% -c "" >tmp/stdout.txt 2>tmp/stderr.txt
if %ERRORLEVEL% == 0 goto :check_pip
echo Couldn't launch python
goto :show_stdout_stderr

:check_pip
%PYTHON% -mpip --help >tmp/stdout.txt 2>tmp/stderr.txt
if %ERRORLEVEL% == 0 goto :start_venv
if "%PIP_INSTALLER_LOCATION%" == "" goto :show_stdout_stderr
%PYTHON% "%PIP_INSTALLER_LOCATION%" >tmp/stdout.txt 2>tmp/stderr.txt
if %ERRORLEVEL% == 0 goto :start_venv
echo Couldn't install pip
goto :show_stdout_stderr

:start_venv
if ["%VENV_DIR%"] == ["-"] goto :skip_venv
if ["%SKIP_VENV%"] == ["1"] goto :skip_venv

dir "%VENV_DIR%\Scripts\Python.exe" >tmp/stdout.txt 2>tmp/stderr.txt
if %ERRORLEVEL% == 0 goto :activate_venv

for /f "delims=" %%i in ('CALL %PYTHON% -c "import sys; print(sys.executable)"') do set PYTHON_FULLNAME="%%i"
echo Creating venv in directory %VENV_DIR% using python %PYTHON_FULLNAME%
%PYTHON_FULLNAME% -m venv "%VENV_DIR%" >tmp/stdout.txt 2>tmp/stderr.txt
if %ERRORLEVEL% == 0 goto :activate_venv
echo Unable to create venv in directory "%VENV_DIR%"
goto :show_stdout_stderr

:activate_venv
set PYTHON="%VENV_DIR%\Scripts\Python.exe"
echo venv %PYTHON%

:skip_venv
goto :launch

:launch
%PYTHON% app.py %COMMANDLINE_ARGS% %*
pause
exit /b

:show_stdout_stderr

echo.
echo exit code: %errorlevel%

for /f %%i in ("tmp\stdout.txt") do set size=%%~zi
if %size% equ 0 goto :show_stderr
echo.
echo stdout:
type tmp\stdout.txt

:show_stderr
for /f %%i in ("tmp\stderr.txt") do set size=%%~zi
if %size% equ 0 goto :endofscript
echo.
echo stderr:
type tmp\stderr.txt

:endofscript

echo.
echo Launch unsuccessful. Exiting.
pause