Spaces:

spacerini
/

code-search

Sleeping

cakiki committed on Feb 25, 2023

Commit

1a2fbfc

1 Parent(s): d6cb72b

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -27,8 +27,12 @@ def result_html(result, meta):
     f"<div><details><summary>{result[:250]}...</summary><p>{result[250:]}</p></details></div><br><hr><br>"
     )
-def format_results(results):
-    return "\n".join([result_html(result, meta) for result,meta in zip(results[TEXT_FIELD], results[METADATA_FIELD])])
 def page_0(query):
     untokenized_query = query
@@ -36,13 +40,13 @@ def page_0(query):
     hits = searcher.search(query, k=NUM_PAGES*RESULTS_PER_PAGE)
     ix = [int(hit.docid) for hit in hits]
     results = ds.select(ix).shard(num_shards=NUM_PAGES, index=0, contiguous=True) # no need to shard. split ix in batches instead. (would make sense if results was cacheable)
-    results = format_results(results)
     return results, [ix], gr.update(visible=True), untokenized_query
 def page_i(i, ix, query):
     ix = ix[0]
     results = ds.select(ix).shard(num_shards=NUM_PAGES, index=i, contiguous=True)
-    results = format_results(results)
     return results, [ix], query
 with gr.Blocks(css="#b {min-width:15px;background:transparent;border:white;box-shadow:none;}") as demo: #

     f"<div><details><summary>{result[:250]}...</summary><p>{result[250:]}</p></details></div><br><hr><br>"
     )
+def format_results(results, query):
+    text_content = results[TEXT_FIELD]
+    query_words = query.split()
+    for word in query_words:
+        text_content = [text.replace(word, f"<b>{word}</b>") for text in text_content]
+    return "\n".join([result_html(result, meta) for result,meta in zip(text_content, results[METADATA_FIELD])])
 def page_0(query):
     untokenized_query = query
     hits = searcher.search(query, k=NUM_PAGES*RESULTS_PER_PAGE)
     ix = [int(hit.docid) for hit in hits]
     results = ds.select(ix).shard(num_shards=NUM_PAGES, index=0, contiguous=True) # no need to shard. split ix in batches instead. (would make sense if results was cacheable)
+    results = format_results(results, untokenized_query)
     return results, [ix], gr.update(visible=True), untokenized_query
 def page_i(i, ix, query):
+    """Build the HTML for result page ``i`` of an earlier search.
+
+    Args:
+        i: Index of the shard (page) to render, out of NUM_PAGES.
+        ix: One-element list wrapping the list of hit doc ids, i.e. the
+            ``[ix]`` form that page_0 returns.
+        query: Query string handed to format_results for highlighting.
+
+    Returns:
+        Tuple of (formatted results, ``[ix]`` re-wrapped, query unchanged).
+    """
+    # Unwrap the id list from its single-element container.
     ix = ix[0]
+    # Select the hit rows, then keep only the i-th of NUM_PAGES contiguous shards.
     results = ds.select(ix).shard(num_shards=NUM_PAGES, index=i, contiguous=True)
+    results = format_results(results, query)
     return results, [ix], query
 with gr.Blocks(css="#b {min-width:15px;background:transparent;border:white;box-shadow:none;}") as demo: #