Spaces:
Runtime error
Runtime error
Commit
·
5a994f8
1
Parent(s):
84fa2e9
threading error onnx fix
Browse files
app.py
CHANGED
@@ -87,9 +87,12 @@ hide_streamlit_style = """
|
|
87 |
"""
|
88 |
st.markdown(hide_streamlit_style, unsafe_allow_html=True)
|
89 |
|
90 |
-
options
|
91 |
-
|
92 |
-
|
|
|
|
|
|
|
93 |
|
94 |
|
95 |
@st.cache(allow_output_mutation=True, suppress_st_warning=True, max_entries=None, ttl=None)
|
@@ -139,7 +142,7 @@ def sentiment_task_selected(task,
|
|
139 |
# create_onnx_model_sentiment(_model=model_sentiment, _tokenizer=tokenizer_sentiment)
|
140 |
|
141 |
#create inference session
|
142 |
-
sentiment_session = ort.InferenceSession(f"{sent_onnx_mdl_dir}/{sent_onnx_mdl_name}")
|
143 |
# sentiment_session_quant = ort.InferenceSession(f"{sent_onnx_mdl_dir}/{sent_onnx_quant_mdl_name}")
|
144 |
|
145 |
return tokenizer_sentiment,sentiment_session
|
@@ -170,7 +173,7 @@ def zs_task_selected(task,
|
|
170 |
# create_onnx_model_zs()
|
171 |
|
172 |
#create inference session from onnx model
|
173 |
-
zs_session = ort.InferenceSession(f"{zs_onnx_mdl_dir}/{zs_onnx_mdl_name}")
|
174 |
# zs_session_quant = ort.InferenceSession(f"{zs_onnx_mdl_dir}/{zs_onnx_quant_mdl_name}")
|
175 |
|
176 |
return tokenizer_zs,zs_session
|
|
|
87 |
"""
|
88 |
st.markdown(hide_streamlit_style, unsafe_allow_html=True)
|
89 |
|
90 |
+
# ONNX Runtime inference threading changes -- session options must be passed when the InferenceSession is created (sess_options=...)
|
91 |
+
# os.environ["OMP_NUM_THREADS"] = "1"
|
92 |
+
session_options_ort = ort.SessionOptions()
|
93 |
+
session_options_ort.intra_op_num_threads=1
|
94 |
+
session_options_ort.inter_op_num_threads=1
|
95 |
+
# session_options_ort.execution_mode = ort.ExecutionMode.ORT_SEQUENTIAL
|
96 |
|
97 |
|
98 |
@st.cache(allow_output_mutation=True, suppress_st_warning=True, max_entries=None, ttl=None)
|
|
|
142 |
# create_onnx_model_sentiment(_model=model_sentiment, _tokenizer=tokenizer_sentiment)
|
143 |
|
144 |
#create inference session
|
145 |
+
sentiment_session = ort.InferenceSession(f"{sent_onnx_mdl_dir}/{sent_onnx_mdl_name}",sess_options=session_options_ort)
|
146 |
# sentiment_session_quant = ort.InferenceSession(f"{sent_onnx_mdl_dir}/{sent_onnx_quant_mdl_name}")
|
147 |
|
148 |
return tokenizer_sentiment,sentiment_session
|
|
|
173 |
# create_onnx_model_zs()
|
174 |
|
175 |
#create inference session from onnx model
|
176 |
+
zs_session = ort.InferenceSession(f"{zs_onnx_mdl_dir}/{zs_onnx_mdl_name}",sess_options=session_options_ort)
|
177 |
# zs_session_quant = ort.InferenceSession(f"{zs_onnx_mdl_dir}/{zs_onnx_quant_mdl_name}")
|
178 |
|
179 |
return tokenizer_zs,zs_session
|