Spaces:

hpi-dhc
/

FairEval

Runtime error

App Files Files Community

illorca committed on Dec 12, 2022

Commit

6a56d7d

1 Parent(s): 68b945f

Update Readme

Browse files

Files changed (1) hide show

README.md +29 -46

README.md CHANGED Viewed

@@ -3,7 +3,7 @@ title: FairEval
 tags:
 - evaluate
 - metric
-description: "TODO: add a description here"
 sdk: gradio
 sdk_version: 3.0.2
 app_file: app.py
@@ -82,59 +82,42 @@ Considering the following input annotated sentences:
 The output for different modes and error_formats is:
 ```python
 >>> faireval.compute(predictions=y_pred, references=y_true, mode='fair', error_format='count')
-{"PER": {"precision": 1.0,"recall": 0.5,"f1": 0.6666,
-         "trad_prec": 0.5,"trad_rec": 0.5,"trad_f1": 0.5,
-         "TP": 1,"FP": 0.0,"FN": 1.0,"LE": 0.0,"BE": 0.0,"LBE": 0.0},
- "INT": {"precision": 0.0,"recall": 0.0,"f1": 0.0,
-         "trad_prec": 0.0,"trad_rec": 0.0,"trad_f1": 0.0,
-         "TP": 0,"FP": 0.0,"FN": 0.0,"LE": 0.0,"BE": 1.0,"LBE": 1.0},
- "OUT": {"precision": 0.6666,"recall": 0.6666,"f1": 0.666,
-         "trad_prec": 0.5,"trad_rec": 0.5,"trad_f1": 0.5,
-         "TP": 1,"FP": 0.0,"FN": 0.0,"LE": 1.0,"BE": 0.0,"LBE": 0.0},
- "overall_precision": 0.5714,
- "overall_recall": 0.4444,
- "overall_f1": 0.5,
- "overall_trad_prec": 0.4,
- "overall_trad_rec": 0.3333,
- "overall_trad_f1": 0.3636,
- "TP": 2,
- "FP": 0.0,
- "FN": 1.0,
- "LE": 1.0,
- "BE": 1.0,
- "LBE": 1.0}
 ```
 ```python
 >>> faireval.compute(predictions=y_pred, references=y_true, mode='traditional', error_format='count')
-{"PER": {"precision": 0.5,"recall": 0.5,"f1": 0.5,
-         "TP": 1,"FP": 1.0,"FN": 1.0},
- "INT": {"precision": 0.0,"recall": 0.0,"f1": 0.0,
-         "TP": 0,"FP": 1.0,"FN": 2.0},
- "OUT": {"precision": 0.5,"recall": 0.5,"f1": 0.5,
-         "TP": 1,"FP": 1.0,"FN": 1.0},
- "overall_precision": 0.4,
- "overall_recall": 0.3333,
- "overall_f1": 0.3636,
- "TP": 2,
- "FP": 3.0,
- "FN": 4.0}
 ```
 ```python
 >>> faireval.compute(predictions=y_pred, references=y_true, mode='traditional', error_format='error_ratio')
-{"PER": {"precision": 0.5,"recall": 0.5,"f1": 0.5,
-         "TP": 1,"FP": 0.1428,"FN": 0.1428},
- "INT": {"precision": 0.0,"recall": 0.0,"f1": 0.0,
-         "TP": 0,"FP": 0.14285714285714285,"FN": 0.2857},
- "OUT": {"precision": 0.5,"recall": 0.5,"f1": 0.5,
-         "TP": 1,"FP": 0.1428,"FN": 0.1428},
- "overall_precision": 0.4,
- "overall_recall": 0.3333,
- "overall_f1": 0.3636,
- "TP": 2,
- "FP": 0.4285,
- "FN": 0.5714}
 ```
 #### Values from Popular Papers

 tags:
 - evaluate
 - metric
+description: "Fair Evaluation for Sequence labeling"
 sdk: gradio
 sdk_version: 3.0.2
 app_file: app.py
 The output for different modes and error_formats is:
 ```python
 >>> faireval.compute(predictions=y_pred, references=y_true, mode='fair', error_format='count')
+{"PER": {"precision": 1.0, "recall": 0.5, "f1": 0.6666,
+         "trad_prec": 0.5, "trad_rec": 0.5, "trad_f1": 0.5,
+         "TP": 1, "FP": 0.0, "FN": 1.0, "LE": 0.0, "BE": 0.0, "LBE": 0.0},
+ "INT": {"precision": 0.0, "recall": 0.0, "f1": 0.0,
+         "trad_prec": 0.0, "trad_rec": 0.0, "trad_f1": 0.0,
+         "TP": 0, "FP": 0.0, "FN": 0.0, "LE": 0.0, "BE": 1.0, "LBE": 1.0},
+ "OUT": {"precision": 0.6666, "recall": 0.6666, "f1": 0.6666,
+         "trad_prec": 0.5, "trad_rec": 0.5, "trad_f1": 0.5,
+         "TP": 1, "FP": 0.0, "FN": 0.0, "LE": 1.0, "BE": 0.0, "LBE": 0.0},
+ "overall_precision": 0.5714, "overall_recall": 0.4444, "overall_f1": 0.5,
+ "overall_trad_prec": 0.4, "overall_trad_rec": 0.3333, "overall_trad_f1": 0.3636,
+ "TP": 2, "FP": 0.0, "FN": 1.0, "LE": 1.0, "BE": 1.0, "LBE": 1.0}
 ```
 ```python
 >>> faireval.compute(predictions=y_pred, references=y_true, mode='traditional', error_format='count')
+{"PER": {"precision": 0.5, "recall": 0.5, "f1": 0.5,
+         "TP": 1, "FP": 1.0, "FN": 1.0},
+ "INT": {"precision": 0.0, "recall": 0.0, "f1": 0.0,
+         "TP": 0, "FP": 1.0, "FN": 2.0},
+ "OUT": {"precision": 0.5, "recall": 0.5, "f1": 0.5,
+         "TP": 1, "FP": 1.0, "FN": 1.0},
+ "overall_precision": 0.4, "overall_recall": 0.3333, "overall_f1": 0.3636,
+ "TP": 2, "FP": 3.0, "FN": 4.0}
 ```
 ```python
 >>> faireval.compute(predictions=y_pred, references=y_true, mode='traditional', error_format='error_ratio')
+{"PER": {"precision": 0.5, "recall": 0.5, "f1": 0.5,
+         "TP": 1, "FP": 0.1428, "FN": 0.1428},
+ "INT": {"precision": 0.0, "recall": 0.0, "f1": 0.0,
+         "TP": 0, "FP": 0.1428, "FN": 0.2857},
+ "OUT": {"precision": 0.5, "recall": 0.5, "f1": 0.5,
+         "TP": 1, "FP": 0.1428, "FN": 0.1428},
+ "overall_precision": 0.4, "overall_recall": 0.3333, "overall_f1": 0.3636,
+ "TP": 2, "FP": 0.4285, "FN": 0.5714}
 ```
 #### Values from Popular Papers