kambris committed on
Commit
8585464
·
verified ·
1 Parent(s): 84cf1b5

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -59,7 +59,7 @@ ARABIC_STOP_WORDS = {
59
  'ูˆูƒุงู†', 'ูˆูƒุงู†ุช', 'ูˆูƒู„', 'ูˆุจุนุถ', 'ูˆุญูˆู„', 'ูˆุนู†ุฏ', 'ูˆู‚ุฏ',
60
  'ูˆู„ู‚ุฏ', 'ูˆู„ู…', 'ูˆู„ู†', 'ูˆู…ุง', 'ูˆูƒูŠู', 'ูˆุงูŠู†', 'ูˆุงู„ุฐูŠ',
61
  'ูˆุจูŠู†', 'ูˆู‚ุจู„', 'ูˆุจุนุฏ', 'ูˆู„ู‡', 'ูˆู„ู‡ุง', 'ูˆู‡ู†ุงูƒ', 'ูˆุงู†ู‡',
62
- 'ูˆู„ุฏู‰', 'ูˆุนู„ูŠู‡', 'ูˆู…ุซู„',
63
 
64
  # Arabic numbers
65
  'ูˆุงุญุฏ', 'ุงุซู†ุงู†', 'ุซู„ุงุซุฉ', 'ุฃุฑุจุนุฉ', 'ุฎู…ุณุฉ', 'ุณุชุฉ', 'ุณุจุนุฉ',
@@ -506,7 +506,7 @@ if uploaded_file is not None:
506
  df['country'] = df['country'].str.strip()
507
  df = df.dropna(subset=['country', 'poem'])
508
  # Extract 10 rows per country
509
- sampled_df = df.groupby('country').apply(lambda x: x.head(10)).reset_index(drop=True)
510
 
511
  st.subheader("Topic Modeling Settings")
512
  col1, col2 = st.columns(2)
 
59
  'ูˆูƒุงู†', 'ูˆูƒุงู†ุช', 'ูˆูƒู„', 'ูˆุจุนุถ', 'ูˆุญูˆู„', 'ูˆุนู†ุฏ', 'ูˆู‚ุฏ',
60
  'ูˆู„ู‚ุฏ', 'ูˆู„ู…', 'ูˆู„ู†', 'ูˆู…ุง', 'ูˆูƒูŠู', 'ูˆุงูŠู†', 'ูˆุงู„ุฐูŠ',
61
  'ูˆุจูŠู†', 'ูˆู‚ุจู„', 'ูˆุจุนุฏ', 'ูˆู„ู‡', 'ูˆู„ู‡ุง', 'ูˆู‡ู†ุงูƒ', 'ูˆุงู†ู‡',
62
+ 'ู…ู†ู‡','ุงู„ุง','ููŠู‡ุง','ูู„ุง','ูˆูƒู…','ูŠูƒู†','ุนู„ูŠูƒ','ู…ู†ู‡ุง','ูู…ุง','ู„ู‡ู…','ูŠูƒู†','ูˆุงู†ูŠ','ู‡ู„','ูู‡ู„','ุจูŠ','ู†ุญูˆ','ูƒูŠ','ุณูˆู','ูƒู†ุง','ู„ู†ุง','ู…ุนุง','ูƒู„ู…ุง','ูˆุฅุฐุง','ู…ู†ู‡','ุนู†ู‡','ุฅุฐ','ูƒู…','ุจู„','ููŠู‡ุง','ู‡ูƒุฐุง','ู„ู‡ู…','ูˆู„ุฏู‰', 'ูˆุนู„ูŠู‡', 'ูˆู…ุซู„',
63
 
64
  # Arabic numbers
65
  'ูˆุงุญุฏ', 'ุงุซู†ุงู†', 'ุซู„ุงุซุฉ', 'ุฃุฑุจุนุฉ', 'ุฎู…ุณุฉ', 'ุณุชุฉ', 'ุณุจุนุฉ',
 
506
  df['country'] = df['country'].str.strip()
507
  df = df.dropna(subset=['country', 'poem'])
508
  # Extract up to 50 rows per country
509
+ sampled_df = df.groupby('country').apply(lambda x: x.head(50)).reset_index(drop=True)
510
 
511
  st.subheader("Topic Modeling Settings")
512
  col1, col2 = st.columns(2)