Spaces:

raynardj
/

duguwen-classical-chinese-to-morden-translate

Runtime error

App Files Files Community

raynardj committed on Jan 5, 2022

Commit

2fc06de

1 Parent(s): e0a6c5a

🎸 logging

Browse files

Files changed (1) hide show

app.py +9 -9

app.py CHANGED Viewed

@@ -24,6 +24,7 @@ tokenizer, model = load_model()
 def inference(text):
     tk_kwargs = dict(
         truncation=True,
         max_length=168,
@@ -32,7 +33,7 @@ def inference(text):
     inputs = tokenizer([text, ], **tk_kwargs)
     with torch.no_grad():
-        return tokenizer.batch_decode(
             model.generate(
                 inputs.input_ids,
                 attention_mask=inputs.attention_mask,
@@ -42,6 +43,8 @@ def inference(text):
                 eos_token_id=tokenizer.sep_token_id,
                 pad_token_id=tokenizer.pad_token_id,
             ), skip_special_tokens=True)[0].replace(" ", "")
 @st.cache
@@ -96,6 +99,7 @@ def fetch_file(path):
     obj_hash = file_obj_hash_map[path]
     auth = HTTPBasicAuth(USER_ID, SECRET)
     url = f"https://api.github.com/repos/garychowcmu/daizhigev20/git/blobs/{obj_hash}"
     r = requests.get(url, auth=auth)
     if r.status_code == 200:
         data = r.json()
@@ -121,8 +125,6 @@ def show_filepath(filepath: str):
 if st.sidebar.selectbox(label="何以尋跡 How to search",options=["以類尋書 category","書名求書 search"])=="以類尋書 category":
-    st.session_state.translating = False
     # root_data = fetch_from_github()
     if 'pathway' in st.session_state:
         pass
@@ -151,12 +153,14 @@ if st.sidebar.selectbox(label="何以尋跡 How to search",options=["以類尋
                 with st.spinner(f"Load 載文:{filepath},({show_file_size(file_size)})"):
                     # if file size is too large, we will not load it
                     if file_size > 3*1024*1024:
                         urlpath = filepath.replace(".txt", ".html")
                         dzg = f"http://www.daizhige.org/{urlpath}"
                         st.markdown(f"File too big 其文碩而難載，不能為之，[往 殆知閣]({dzg}), 或擇他書")
                         reset_path()
                         return None
                     path_text.text(filepath)
                     text = fetch_file(filepath)
                     # create markdown with max heights
                     c.markdown(
@@ -170,8 +174,7 @@ if st.sidebar.selectbox(label="何以尋跡 How to search",options=["以類尋
                 path_text.text("/".join(st.session_state.pathway))
                 display_tree()
-    if st.session_state.translating == False:
-        display_tree()
 else:
     def search_kw():
         result = file_df[file_df.filepath.str.contains(st.session_state.kw)].reset_index(drop=True)
@@ -186,12 +189,10 @@ else:
         st.session_state.kw = kw
         search_kw()
-    if st.session_state.translating == False:
-        loading_with_search()
 def translate_text():
-    st.session_state.translating = True
     if c2.button("【曉文達義 Translate】"):
         if cc:
             if len(cc) > 168:
@@ -200,7 +201,6 @@ def translate_text():
                 c2.markdown(f"""```{inference(cc)}```""")
         else:
             c2.write("【入難曉之文字 Please input sentence for translating】")
-    st.session_state.translating = False
 cc = c2.text_area("【入難曉之文字 Input sentence】", height=150)
 translate_text()

 def inference(text):
+    print(f"from: {text}")
     tk_kwargs = dict(
         truncation=True,
         max_length=168,
     inputs = tokenizer([text, ], **tk_kwargs)
     with torch.no_grad():
+        new = tokenizer.batch_decode(
             model.generate(
                 inputs.input_ids,
                 attention_mask=inputs.attention_mask,
                 eos_token_id=tokenizer.sep_token_id,
                 pad_token_id=tokenizer.pad_token_id,
             ), skip_special_tokens=True)[0].replace(" ", "")
+    print(f"to: {new}")
+    return new
 @st.cache
     obj_hash = file_obj_hash_map[path]
     auth = HTTPBasicAuth(USER_ID, SECRET)
     url = f"https://api.github.com/repos/garychowcmu/daizhigev20/git/blobs/{obj_hash}"
+    print(f"requesting {url}")
     r = requests.get(url, auth=auth)
     if r.status_code == 200:
         data = r.json()
 if st.sidebar.selectbox(label="何以尋跡 How to search",options=["以類尋書 category","書名求書 search"])=="以類尋書 category":
     # root_data = fetch_from_github()
     if 'pathway' in st.session_state:
         pass
                 with st.spinner(f"Load 載文:{filepath},({show_file_size(file_size)})"):
                     # if file size is too large, we will not load it
                     if file_size > 3*1024*1024:
+                        print(f"skip {filepath}")
                         urlpath = filepath.replace(".txt", ".html")
                         dzg = f"http://www.daizhige.org/{urlpath}"
                         st.markdown(f"File too big 其文碩而難載，不能為之，[往 殆知閣]({dzg}), 或擇他書")
                         reset_path()
                         return None
                     path_text.text(filepath)
+                    print(f"read {filepath}")
                     text = fetch_file(filepath)
                     # create markdown with max heights
                     c.markdown(
                 path_text.text("/".join(st.session_state.pathway))
                 display_tree()
+    display_tree()
 else:
     def search_kw():
         result = file_df[file_df.filepath.str.contains(st.session_state.kw)].reset_index(drop=True)
         st.session_state.kw = kw
         search_kw()
+    loading_with_search()
 def translate_text():
     if c2.button("【曉文達義 Translate】"):
         if cc:
             if len(cc) > 168:
                 c2.markdown(f"""```{inference(cc)}```""")
         else:
             c2.write("【入難曉之文字 Please input sentence for translating】")
 cc = c2.text_area("【入難曉之文字 Input sentence】", height=150)
 translate_text()