Spaces:

holistic-ai
/

explainbility_benchmark

Sleeping

Zekun Wu committed on May 13, 2024

Commit

da04c4f

1 Parent(s): 2316f10

update

Files changed (1) hide show

util/evaluator.py CHANGED Viewed

@@ -59,7 +59,7 @@ class evaluator:
         """
         response = self.model.invoke(evaluation_prompt,temperature=0.8, max_tokens=60).strip()
-        #response = """        {{"Factually Correct": 0.9,"Useful": 0.85,"Context Specific": 0.8,"User Specific": 0.75,"Provides Pluralism": 0.7}}"""
         print(response)
         try:
             scores = json.loads(response)
@@ -71,7 +71,8 @@ class evaluator:
                 scores = json.loads(repaired_json)
             except json.JSONDecodeError:
                 print("Failed to decode JSON response even after repair attempt. Skipping this batch.")
-                return None
         return self.validate_scores(scores)

         """
         response = self.model.invoke(evaluation_prompt,temperature=0.8, max_tokens=60).strip()
+        #response = """{{"Factually Correct": 0.9,"Useful": 0.85,"Context Specific": 0.8,"User Specific": 0.75,"Provides Pluralism": 0.7}}"""
         print(response)
         try:
             scores = json.loads(response)
                 scores = json.loads(repaired_json)
             except json.JSONDecodeError:
                 print("Failed to decode JSON response even after repair attempt. Skipping this batch.")
+                return {"Factually Correct": -1,"Useful": -1,"Context Specific": -1,"User Specific":-1,"Provides Pluralism":-1}
         return self.validate_scores(scores)