Spaces:

madoss
/

gdiy

Runtime error

madoss committed on Aug 9, 2022

Commit

1013d06

1 Parent(s): d139382

add topics

Files changed (2) hide show

app.py CHANGED Viewed

@@ -63,15 +63,11 @@ stopword = stopword + context # add some frequent words in the documents
 clean_text = df_clean['description'].apply(lambda x: clean_up1(x, stopword, pos))
 docs = clean_text.apply(lambda x: " ".join(x)).tolist()
-topic_model = BERTopic(language="multilingual",
-                       nr_topics=6,
-                       top_n_words=30,
-                       low_memory=True,
-                       n_gram_range=(1, 2))
-topics, _ = topic_model.fit_transform(docs)
-topic_fig = topic_model.visualize_barchart(n_words=10)
 timestamps = df_clean.index
 topics_over_time = topic_model.topics_over_time(docs, topics, timestamps,
@@ -86,6 +82,8 @@ topics_over_time.set_index('Timestamp', inplace=True)
 topics_over_time['year'] = topics_over_time.index.year
 topic_per_year = topics_over_time.groupby(['year'])['Words'].apply(lambda x: x.str.cat(sep=' '))
 fig1, ax = plt.subplots()
 sns.countplot(ax=ax, x='year', data=df_clean, palette='viridis');

 clean_text = df_clean['description'].apply(lambda x: clean_up1(x, stopword, pos))
 docs = clean_text.apply(lambda x: " ".join(x)).tolist()
+topic_model = BERTopic.load("bertopic")
+with open('topics', 'rb') as f:
+    topics = pickle.load(f)
 timestamps = df_clean.index
 topics_over_time = topic_model.topics_over_time(docs, topics, timestamps,
 topics_over_time['year'] = topics_over_time.index.year
 topic_per_year = topics_over_time.groupby(['year'])['Words'].apply(lambda x: x.str.cat(sep=' '))
+topic_fig = topic_model.visualize_barchart(n_words=10)
 fig1, ax = plt.subplots()
 sns.countplot(ax=ax, x='year', data=df_clean, palette='viridis');

topics ADDED Viewed

Binary file (1.17 kB). View file