Spaces:

VyLala
/

mtDNALocation

Running

App Files Community

VyLala committed 12 days ago

Commit

9cbd44c

verified ·

1 Parent(s): b10f2c3

Update model.py

Browse files

Files changed (1) hide show

model.py +27 -7

model.py CHANGED Viewed

@@ -865,10 +865,13 @@ def parse_multi_sample_llm_output(raw_response: str, output_format_str):
     metadata_list = {}
     explanation_lines = []
     output_answers = raw_response.split("\n")[0].split(", ")
     if ". " in raw_response.split("\n")[1] and len(raw_response.split("\n")[1].split(". ")) > 1:
         explanation_lines =  [x for x in raw_response.split(". ")[1] if x.strip()]
     else:
         explanation_lines =  [x for x in raw_response.split("\n")[1:] if x.strip()]
     output_formats = output_format_str.split(", ")
     explain = ""
     # assign output format to its output answer and explanation
@@ -1209,16 +1212,33 @@ def query_document_info(query_word, alternative_query_word, metadata, master_str
 #     f"Output Format: {output_format_str}"
 # )
         prompt_for_llm = (
     f"{prompt_instruction_prefix}"
-    f"Given the following text snippets, analyze the entity/concept {rag_query_phrase} or the mitochondrial DNA sample in {organism} if these specific identifiers are not explicitly found. "
-    f"Identify its primary associated country/geographic location. "
-    f"Also, determine if the genetic sample or individual mentioned is from a 'modern' (present-day living individual) "
-    f"or 'ancient' (e.g., prehistoric remains, archaeological sample) source. "
-    f"If the text does not mention whether the sample is ancient or modern, assume the sample is modern unless otherwise explicitly described as ancient or archaeological. "
     f"Provide only {output_format_str}. "
-    f"If any information is not explicitly present in the provided text snippets, state 'unknown' for that specific piece of information. "
-    f"If the {explain_list} is not 'unknown', write 1 sentence after the output explaining how you inferred it from the text (one sentence for each)."
     f"\n\nText Snippets:\n{context_for_llm}\n\n"
     f"Output Format: {output_format_str}"
 )

     metadata_list = {}
     explanation_lines = []
     output_answers = raw_response.split("\n")[0].split(", ")
+    print("raw explanation line: raw_response.split("\n")[1]")
     if ". " in raw_response.split("\n")[1] and len(raw_response.split("\n")[1].split(". ")) > 1:
         explanation_lines =  [x for x in raw_response.split(". ")[1] if x.strip()]
+        print("explain line split by dot: ", explanation_lines)
     else:
         explanation_lines =  [x for x in raw_response.split("\n")[1:] if x.strip()]
+        print("explain line split by new line: ", explanation_lines)
     output_formats = output_format_str.split(", ")
     explain = ""
     # assign output format to its output answer and explanation
 #     f"Output Format: {output_format_str}"
 # )
+#         prompt_for_llm = (
+#     f"{prompt_instruction_prefix}"
+#     f"Given the following text snippets, analyze the entity/concept {rag_query_phrase} or the mitochondrial DNA sample in {organism} if these specific identifiers are not explicitly found. "
+#     f"Identify its primary associated country/geographic location. "
+#     f"Also, determine if the genetic sample or individual mentioned is from a 'modern' (present-day living individual) "
+#     f"or 'ancient' (e.g., prehistoric remains, archaeological sample) source. "
+#     f"If the text does not mention whether the sample is ancient or modern, assume the sample is modern unless otherwise explicitly described as ancient or archaeological. "
+#     f"Provide only {output_format_str}. "
+#     f"If any information is not explicitly present in the provided text snippets, state 'unknown' for that specific piece of information. "
+#     f"If the {explain_list} is not 'unknown', write 1 sentence after the output explaining how you inferred it from the text (one sentence for each)."
+#     f"\n\nText Snippets:\n{context_for_llm}\n\n"
+#     f"Output Format: {output_format_str}"
+# )
         prompt_for_llm = (
     f"{prompt_instruction_prefix}"
+    f"Given the following text snippets, analyze the entity/concept {rag_query_phrase} "
+    f"or the mitochondrial DNA sample in {organism} if these identifiers are not explicitly found. "
+    f"Identify its **primary associated geographic location**, preferring the most specific available: "
+    f"first try to determine the exact country; if no country is explicitly mentioned, then provide "
+    f"the next most specific region, continent, island, or other clear geographic area mentioned. "
+    f"If no geographic clues at all are present, state 'unknown' for location. "
+    f"Also, determine if the genetic sample is from a 'modern' (present-day living individual) "
+    f"or 'ancient' (prehistoric/archaeological) source. "
+    f"If the text does not specify ancient or archaeological context, assume 'modern'. "
     f"Provide only {output_format_str}. "
+    f"If any information is not explicitly present, use the fallback rules above before defaulting to 'unknown'. "
+    f"For each non-'unknown' field in {explain_list}, write one sentence explaining how it was inferred from the text (one sentence for each)."
     f"\n\nText Snippets:\n{context_for_llm}\n\n"
     f"Output Format: {output_format_str}"
 )