Spaces:

domenicrosati
/

scite-qa-demo

Runtime error

App Files Community

domenicrosati committed on Sep 19, 2022

Commit

82fe24c

1 Parent(s): 8457196

try fallback

Browse files

Files changed (1) hide show

app.py +23 -6

app.py CHANGED Viewed

@@ -150,12 +150,15 @@ st.markdown("""
 """, unsafe_allow_html=True)
 with st.expander("Settings (strictness, context limit, top hits)"):
     confidence_threshold = st.slider('Confidence threshold for answering questions? This number represents how confident the model should be in the answers it gives. The number is out of 100%', 0, 100, 1)
     use_reranking = st.radio(
         "Use Reranking? Reranking will rerank the top hits using semantic similarity of document and query.",
         ('yes', 'no'))
     top_hits_limit = st.slider('Top hits? How many documents to use for reranking. Larger is slower but higher quality', 10, 300, 100)
-    context_lim = st.slider('Context limit? How many documents to use for answering from. Larger is slower but higher quality', 10, 300, 25)
 # def paraphrase(text, max_length=128):
 #     input_ids = queryexp_tokenizer.encode(text, return_tensors="pt", add_special_tokens=True)
@@ -171,15 +174,29 @@ def run_query(query):
 # If you are not getting good results try one of:
 # * {query_exp}
 # """)
     limit = top_hits_limit or 100
     context_limit = context_lim or 10
     contexts_strict, orig_docs_strict = search(query, limit=limit, strict=True)
-    contexts_lenient, orig_docs_lenient = search(query, limit=limit, strict=False)
-    contexts = list(
-        set(contexts_strict + contexts_lenient)
-    )
-    orig_docs = orig_docs_strict + orig_docs_lenient
     if len(contexts) == 0 or not ''.join(contexts).strip():
         return st.markdown("""

 """, unsafe_allow_html=True)
 with st.expander("Settings (strictness, context limit, top hits)"):
+    strict_lenient_mix = st.radio(
+        "Type of strict+lenient combination: Fallback or Mix? If fallback, strict is run first then if the results are less than context_lim we also search lenient. Mix will search them both and let reranking sort em out",
+        ('fallback', 'mix'))
     confidence_threshold = st.slider('Confidence threshold for answering questions? This number represents how confident the model should be in the answers it gives. The number is out of 100%', 0, 100, 1)
     use_reranking = st.radio(
         "Use Reranking? Reranking will rerank the top hits using semantic similarity of document and query.",
         ('yes', 'no'))
     top_hits_limit = st.slider('Top hits? How many documents to use for reranking. Larger is slower but higher quality', 10, 300, 100)
+    context_lim = st.slider('Context limit? How many documents to use for answering from. Larger is slower but higher quality', 10, 300, 10)
 # def paraphrase(text, max_length=128):
 #     input_ids = queryexp_tokenizer.encode(text, return_tensors="pt", add_special_tokens=True)
 # If you are not getting good results try one of:
 # * {query_exp}
 # """)
+    # could also try fallback if there are no good answers by score...
     limit = top_hits_limit or 100
     context_limit = context_lim or 10
     contexts_strict, orig_docs_strict = search(query, limit=limit, strict=True)
+    if strict_lenient_mix == 'fallback' and len(contexts_strict) < context_limit:
+        contexts_lenient, orig_docs_lenient = search(query, limit=limit, strict=False)
+        contexts = list(
+            set(contexts_strict + contexts_lenient)
+        )
+        orig_docs = orig_docs_strict + orig_docs_lenient
+    elif strict_lenient_mix == 'mix':
+        contexts_lenient, orig_docs_lenient = search(query, limit=limit, strict=False)
+        contexts = list(
+            set(contexts_strict + contexts_lenient)
+        )
+        orig_docs = orig_docs_strict + orig_docs_lenient
+    else:
+        contexts = list(
+            set(contexts_strict)
+        )
+        orig_docs = orig_docs_strict
     if len(contexts) == 0 or not ''.join(contexts).strip():
         return st.markdown("""