Spaces:

venkatasg
/

gleu

Runtime error

App Files Community

venkatasg committed on Jul 5, 2024

Commit

91c44b6

1 Parent(s): ca6b0e0

mean and stdev

Browse files

Files changed (1) hide show

gleu.py +10 -7

gleu.py CHANGED Viewed

@@ -18,6 +18,7 @@ import datasets
 from collections import Counter
 from math import log, exp
 from random import seed, randint
 # TODO: Add BibTeX citation
@@ -49,7 +50,8 @@ Args:
     references: Reference for each prediction. Each reference should be a string with tokens separated by spaces.
     predictions: list of predictions to score. Each prediction should be a string with tokens separated by spaces.
 Returns:
-    gleu_score: Average gleu_score over all predictions.
 Examples:
@@ -57,15 +59,15 @@ Examples:
     >>> references=["We may in actual fact be communicating with a hoax Facebook acccount of a cyberfriend , which we assume to be real but in reality , it is a fake account ."]
     >>> results = my_new_module.compute(references=references, predictions=["We may of actual fact communicating with a hoax Facebook acccount of a cyber friend , which we assumed to be real but in reality , it is a fake account ."])
     >>> print(results)
-    {'gleu_score': 0.6}
     >>> results = my_new_module.compute(references=references, predictions=["We may be in actual fact communicating with a hoax Facebook acccount of a cyber friend , we assume to be real but in reality , it is a fake account ."])
     >>> print(results)
-    {'gleu_score': 0.62}
     >>> results = my_new_module.compute(references=references, predictions=["We may in actual fact communicating with a hoax Facebook account of a cyber friend , which we assume to be real but in reality , it is a fake accounts ."])
     >>> print(results)
-    {'gleu_score': 0.64}
 """
@@ -239,6 +241,7 @@ class gleu(evaluate.Metric):
                 iter_stats[j] = [sum(scores) for scores in zip(iter_stats[j], this_stats)]
-        final_gleu_score = get_gleu_stats([gleu_calculator.compute_gleu(stats)
-          for stats in iter_stats ])[0]
-        return {"gleu_score": final_gleu_score}

 from collections import Counter
 from math import log, exp
 from random import seed, randint
+from numpy import mean, std, round
 # TODO: Add BibTeX citation
     references: Reference for each prediction. Each reference should be a string with tokens separated by spaces.
     predictions: list of predictions to score. Each prediction should be a string with tokens separated by spaces.
 Returns:
+    mean_gleu_score: Average gleu_score over all predictions.
+    SD: Standard deviation of the same gleu scores that are averaged into mean_gleu_score.
 Examples:
     >>> references=["We may in actual fact be communicating with a hoax Facebook acccount of a cyberfriend , which we assume to be real but in reality , it is a fake account ."]
     >>> results = my_new_module.compute(references=references, predictions=["We may of actual fact communicating with a hoax Facebook acccount of a cyber friend , which we assumed to be real but in reality , it is a fake account ."])
     >>> print(results)
+    {'mean_gleu_score': 0.6}
     >>> results = my_new_module.compute(references=references, predictions=["We may be in actual fact communicating with a hoax Facebook acccount of a cyber friend , we assume to be real but in reality , it is a fake account ."])
     >>> print(results)
+    {'mean_gleu_score': 0.62}
     >>> results = my_new_module.compute(references=references, predictions=["We may in actual fact communicating with a hoax Facebook account of a cyber friend , which we assume to be real but in reality , it is a fake accounts ."])
     >>> print(results)
+    {'mean_gleu_score': 0.64}
 """
                 iter_stats[j] = [sum(scores) for scores in zip(iter_stats[j], this_stats)]
+        sent_scores = [gleu_calculator.compute_gleu(stats) for stats in iter_stats]
+        mean_score = round(mean(sent_scores),2)
+        std_score = round(std(sent_scores),2)
+        return {"mean_gleu_score": mean_score, 'SD': std_score}