Update model.py
model.py
CHANGED
@@ -935,12 +935,29 @@ def merge_metadata_outputs(metadata_list):
     return merged
 
 
-def query_document_info(query_word, alternative_query_word, metadata, master_structured_lookup, faiss_index, document_chunks, llm_api_function, chunk=None, all_output=None):
+def query_document_info(query_word, alternative_query_word, metadata, master_structured_lookup, faiss_index, document_chunks, llm_api_function, chunk=None, all_output=None, model_ai=None):
     """
     Queries the document using a hybrid approach:
     1. Local structured lookup (fast, cheap, accurate for known patterns).
     2. RAG with semantic search and LLM (general, flexible, cost-optimized).
     """
+    if model_ai:
+        if model_ai == "gemini-1.5-flash-latest":
+            genai.configure(api_key=os.getenv("GOOGLE_API_KEY"))
+            PRICE_PER_1K_INPUT_LLM = 0.000075        # $0.075 per 1M tokens
+            PRICE_PER_1K_OUTPUT_LLM = 0.0003         # $0.30 per 1M tokens
+            PRICE_PER_1K_EMBEDDING_INPUT = 0.000025  # $0.025 per 1M tokens
+            global_llm_model_for_counting_tokens = genai.GenerativeModel("gemini-1.5-flash-latest")
+        else:
+            genai.configure(api_key=os.getenv("GOOGLE_API_KEY_BACKUP"))
+            # Gemini 2.5 Flash-Lite pricing per 1,000 tokens
+            PRICE_PER_1K_INPUT_LLM = 0.00010         # $0.10 per 1M input tokens
+            PRICE_PER_1K_OUTPUT_LLM = 0.00040        # $0.40 per 1M output tokens
+
+            # Embedding-001 pricing per 1,000 input tokens
+            PRICE_PER_1K_EMBEDDING_INPUT = 0.00015   # $0.15 per 1M input tokens
+            global_llm_model_for_counting_tokens = genai.GenerativeModel("gemini-2.5-flash-lite")
+
     if metadata:
         extracted_country, extracted_specific_location, extracted_ethnicity, extracted_type = metadata["country"], metadata["specific_location"], metadata["ethnicity"], metadata["sample_type"]
         extracted_col_date, extracted_iso, extracted_title, extracted_features = metadata["collection_date"], metadata["isolate"], metadata["title"], metadata["all_features"]
@@ -1097,7 +1114,6 @@ def query_document_info(query_word, alternative_query_word, metadata, master_str
     # run_rag = (extracted_country == 'unknown' or extracted_type == 'unknown')# or \
     # #extracted_ethnicity == 'unknown' or extracted_specific_location == 'unknown')
     run_rag = True
-    global_llm_model_for_counting_tokens = genai.GenerativeModel("gemini-2.5-flash-lite")#('gemini-1.5-flash-latest')
     if run_rag:
         print("try run rag")
         # Determine the phrase for LLM query
@@ -1239,6 +1255,23 @@ def query_document_info(query_word, alternative_query_word, metadata, master_str
         # f"If the {explain_list} is not 'unknown', write 1 sentence after the output explaining how you inferred it from the text (one sentence for each)."
         # f"\n\nText Snippets:\n{context_for_llm}\n\n"
         # f"Output Format: {output_format_str}"
+        # )
+        # prompt_for_llm = (
+        # f"{prompt_instruction_prefix}"
+        # f"Given the following text snippets, analyze the entity/concept {rag_query_phrase} "
+        # f"or the mitochondrial DNA sample in {organism} if these identifiers are not explicitly found. "
+        # f"Identify its **primary associated geographic location**, preferring the most specific available: "
+        # f"first try to determine the exact country; if no country is explicitly mentioned, then provide "
+        # f"the next most specific region, continent, island, or other clear geographic area mentioned. "
+        # f"If no geographic clues at all are present, state 'unknown' for location. "
+        # f"Also, determine if the genetic sample is from a 'modern' (present-day living individual) "
+        # f"or 'ancient' (prehistoric/archaeological) source. "
+        # f"If the text does not specify ancient or archaeological context, assume 'modern'. "
+        # f"Provide only {output_format_str}. "
+        # f"If any information is not explicitly present, use the fallback rules above before defaulting to 'unknown'. "
+        # f"For each non-'unknown' field in {explain_list}, write one sentence explaining how it was inferred from the text (one sentence for each)."
+        # f"\n\nText Snippets:\n{context_for_llm}\n\n"
+        # f"Output Format: {output_format_str}"
         # )
         prompt_for_llm = (
             f"{prompt_instruction_prefix}"
@@ -1253,12 +1286,24 @@ def query_document_info(query_word, alternative_query_word, metadata, master_str
             f"If the text does not specify ancient or archaeological context, assume 'modern'. "
             f"Provide only {output_format_str}. "
             f"If any information is not explicitly present, use the fallback rules above before defaulting to 'unknown'. "
-            f"For each non-'unknown' field in {explain_list}, write one sentence explaining how it was inferred from the text
-            f"
-            f"
+            f"For each non-'unknown' field in {explain_list}, write one sentence explaining how it was inferred from the text "
+            f"(one sentence for each). "
+            f"Format your answer so that:\n"
+            f"1. The **first line** contains only the {output_format_str} answer.\n"
+            f"2. The **second line onward** contains the explanations.\n"
+            f"\nText Snippets:\n{context_for_llm}\n\n"
+            f"Output Format Example:\nChina, modern, Daur, Heilongjiang province.\n"
+            f"The text explicitly states \"chinese Daur ethnic group in Heilongjiang province\", indicating the country, "
+            f"the ethnicity, and the specific province. The study is published in a journal, implying research on living "
+            f"individuals, hence modern."
         )
-
-
+
+        if model_ai:
+            print("back up to ", model_ai)
+            llm_response_text, model_instance = call_llm_api(prompt_for_llm, model=model_ai)
+        else:
+            print("still 2.5 flash gemini")
+            llm_response_text, model_instance = call_llm_api(prompt_for_llm)
         print("\n--- DEBUG INFO FOR RAG ---")
         print("Retrieved Context Sent to LLM (first 500 chars):")
         print(context_for_llm[:500] + "..." if len(context_for_llm) > 500 else context_for_llm)
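
The commit keeps per-1K-token price constants for the LLM and the embedding model next to the token-counting GenerativeModel. A minimal sketch (not code from this repository) of how those pieces could be combined to estimate the cost of one RAG call; the helper name estimate_call_cost is hypothetical, while the prices and model name are the ones hard-coded in the Gemini 2.5 Flash-Lite branch of the diff:

import os
import google.generativeai as genai

genai.configure(api_key=os.getenv("GOOGLE_API_KEY"))

PRICE_PER_1K_INPUT_LLM = 0.00010    # $0.10 per 1M input tokens
PRICE_PER_1K_OUTPUT_LLM = 0.00040   # $0.40 per 1M output tokens

# Same model that the diff stores in global_llm_model_for_counting_tokens.
counting_model = genai.GenerativeModel("gemini-2.5-flash-lite")

def estimate_call_cost(prompt: str, response_text: str) -> float:
    """Rough USD cost estimate for a single prompt/response pair (hypothetical helper)."""
    input_tokens = counting_model.count_tokens(prompt).total_tokens
    output_tokens = counting_model.count_tokens(response_text).total_tokens
    return (input_tokens / 1000) * PRICE_PER_1K_INPUT_LLM \
         + (output_tokens / 1000) * PRICE_PER_1K_OUTPUT_LLM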
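The new model_ai keyword, together with the "back up to" print, suggests the caller can re-run a query against Gemini 1.5 Flash when the default 2.5 Flash-Lite path fails. A hypothetical caller-side wrapper, not part of the commit (the retry logic, the exception handling, and the name retry_query_with_backup are all assumptions):

def retry_query_with_backup(query_fn, *args, **kwargs):
    """Call query_fn with defaults, then retry once with the backup model on failure."""
    try:
        return query_fn(*args, **kwargs)
    except Exception as err:  # e.g. quota exhaustion on the primary model (assumed)
        print("primary model failed, backing up:", err)
        return query_fn(*args, model_ai="gemini-1.5-flash-latest", **kwargs)

# Usage sketch, with the positional arguments supplied as elsewhere in model.py:
# result = retry_query_with_backup(query_document_info, query_word, alternative_query_word,
#                                  metadata, master_structured_lookup, faiss_index,
#                                  document_chunks, call_llm_api)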