Update app.py
Browse files
app.py
CHANGED
@@ -3,12 +3,15 @@ import pandas as pd
|
|
3 |
import gradio as gr
|
4 |
|
5 |
df=pd.read_parquet('df.parquet')
|
6 |
-
#df2=pd.read_parquet('df2.parquet')
|
7 |
-
#df=df.merge(df2)
|
8 |
dirname='lot3'
|
9 |
|
10 |
# Derive a cleaned label from each file path, step by step:
#   1. remove everything up to and including `<dirname>/<one path segment>/`
#   2. remove parentheses
#   3. remove the trailing `/<last segment>` (the file name)
#   4. turn '/' and '-' into spaces
#   5. collapse a space followed by zeros into a single space
# `regex=` is passed explicitly: pandas 2.0 changed the default of
# Series.str.replace to literal matching, which would silently turn the
# pattern-based steps into no-ops. Raw strings keep the patterns unchanged
# while avoiding the invalid-escape warning raised for the backslashes.
df['fileclean']=(
    df.file
    .str.replace(rf'.*{dirname}/[^/]+/','',regex=True)
    .str.replace(r'[\(\)]','',regex=True)
    .str.replace(r'/[^/]+$','',regex=True)
    .str.replace('/',' ',regex=False)
    .str.replace('-',' ',regex=False)
    .str.replace(r' 0+',' ',regex=True)
)
|
11 |
candidats=pd.read_parquet('candidats.parquet')
|
|
|
|
|
|
|
|
|
|
|
12 |
|
13 |
document_store = InMemoryDocumentStore(use_bm25=True)
|
14 |
# Build the list of records to index: one per distinct cleaned path, with the
# 'fileclean' column exposed under the key 'content'.
docs=(
    df
    .drop_duplicates(subset=['fileclean'])
    .rename(columns={'fileclean':'content'})
    .to_dict(orient='records')
)
|
|
|
3 |
import gradio as gr
|
4 |
|
5 |
df=pd.read_parquet('df.parquet')
|
|
|
|
|
6 |
dirname='lot3'
|
7 |
|
8 |
# Derive a cleaned label from each file path, step by step:
#   1. remove everything up to and including `<dirname>/<one path segment>/`
#   2. remove parentheses
#   3. remove the trailing `/<last segment>` (the file name)
#   4. turn '/' and '-' into spaces
#   5. collapse a space followed by zeros into a single space
# `regex=` is passed explicitly: pandas 2.0 changed the default of
# Series.str.replace to literal matching, which would silently turn the
# pattern-based steps into no-ops. Raw strings keep the patterns unchanged
# while avoiding the invalid-escape warning raised for the backslashes.
df['fileclean']=(
    df.file
    .str.replace(rf'.*{dirname}/[^/]+/','',regex=True)
    .str.replace(r'[\(\)]','',regex=True)
    .str.replace(r'/[^/]+$','',regex=True)
    .str.replace('/',' ',regex=False)
    .str.replace('-',' ',regex=False)
    .str.replace(r' 0+',' ',regex=True)
)
|
9 |
candidats=pd.read_parquet('candidats.parquet')
|
10 |
+
# Load the second table and merge it into `candidats`.
df2=pd.read_parquet('df2.parquet')
# Cast columns to str on both sides before merging -- presumably so that a
# dtype mismatch between the two parquet files cannot break the join
# (NOTE(review): confirm against the actual schemas).
for c in df2.columns:
    # Only cast columns that `candidats` actually has: indexing a column that
    # exists only in df2 would raise KeyError.
    if c in candidats.columns:
        candidats[c]=candidats[c].astype(str)
    df2[c]=df2[c].astype(str)
# No `on=` is given, so pandas joins on the columns the two frames share,
# using its default inner join.
candidats=candidats.merge(df2)
|
15 |
|
16 |
document_store = InMemoryDocumentStore(use_bm25=True)
|
17 |
# Build the list of records to index: one per distinct cleaned path, with the
# 'fileclean' column exposed under the key 'content'.
docs=(
    df
    .drop_duplicates(subset=['fileclean'])
    .rename(columns={'fileclean':'content'})
    .to_dict(orient='records')
)
|