Spaces:

WhiteAngelss
/

turkce-varlik-tanima-teknofest-nlp

Running

App Files Community

ihsan66 committed on Jul 30

Commit

1574088

•

1 Parent(s): 28500ed

Update app.py

Browse files

Files changed (1) hide show

app.py +45 -12

app.py CHANGED Viewed

@@ -1,5 +1,5 @@
 import streamlit as st
-from transformers import pipeline, AutoModelForSequenceClassification, AutoTokenizer, AutoModelForTokenClassification, AutoModelWithLMHead
 import pandas as pd
 # Uygulama sayfa ayarları
@@ -16,12 +16,12 @@ example_list = [
 st.title("NLP Toolkit")
 # Görev seçimi
-task_list = ['Metin Sınıflandırma', 'Metin Analizi', 'Duygu Analizi', 'Metin Oluşturma']
 task = st.sidebar.selectbox("Görev Seç", task_list)
 # Metin giriş yöntemi
 st.subheader("Metin Giriş Yöntemi Seç")
-input_method = st.radio("", ('Örneklerden Seç', 'Metin Yaz veya Yapıştır', 'Dosya Yükle'))
 # Metin girişine göre seçim
 if input_method == 'Örneklerden Seç':
@@ -29,12 +29,6 @@ if input_method == 'Örneklerden Seç':
     input_text = st.text_area("Seçilen Metin", selected_text, height=128)
 elif input_method == "Metin Yaz veya Yapıştır":
     input_text = st.text_area('Metin Yaz veya Yapıştır', '', height=128)
-elif input_method == "Dosya Yükle":
-    uploaded_file = st.file_uploader("Dosya Seç", type="txt")
-    if uploaded_file is not None:
-        input_text = str(uploaded_file.read(), "utf-8")
-    else:
-        input_text = ""
 @st.cache_resource
 def load_pipeline(model_name, task_type):
@@ -51,16 +45,17 @@ def load_pipeline(model_name, task_type):
         tokenizer = AutoTokenizer.from_pretrained(model_name)
         return pipeline('sentiment-analysis', model=model, tokenizer=tokenizer)
     elif task_type == "Metin Oluşturma":
-        model = AutoModelWithLMHead.from_pretrained(model_name)
         tokenizer = AutoTokenizer.from_pretrained(model_name)
         return pipeline('text-generation', model=model, tokenizer=tokenizer)
 # Görev ve modele göre pipeline yükleme
 model_dict = {
     "Metin Sınıflandırma": "nlptown/bert-base-multilingual-uncased-sentiment",
-    "Metin Analizi": "dbmdz/bert-large-cased-finetuned-conll03-english",
     "Duygu Analizi": "cardiffnlp/twitter-roberta-base-sentiment",
-    "Metin Oluşturma": "gpt2"
 }
 pipeline_model = load_pipeline(model_dict[task], task)
@@ -80,3 +75,41 @@ if st.button("Çalıştır") and input_text:
         output = pipeline_model(input_text, max_length=100, num_return_sequences=1)
         st.subheader("Oluşturulan Metin")
         st.write(output[0]['generated_text'])

 import streamlit as st
+from transformers import pipeline, AutoModelForSequenceClassification, AutoTokenizer, AutoModelForTokenClassification, AutoModelForCausalLM
 import pandas as pd
 # Uygulama sayfa ayarları
 st.title("NLP Toolkit")
 # Görev seçimi
+task_list = ['Metin Sınıflandırma', 'Metin Analizi', 'Duygu Analizi', 'Metin Oluşturma', 'Varlık Tanıma']
 task = st.sidebar.selectbox("Görev Seç", task_list)
 # Metin giriş yöntemi
 st.subheader("Metin Giriş Yöntemi Seç")
+input_method = st.radio("", ('Örneklerden Seç', 'Metin Yaz veya Yapıştır'))
 # Metin girişine göre seçim
 if input_method == 'Örneklerden Seç':
     input_text = st.text_area("Seçilen Metin", selected_text, height=128)
 elif input_method == "Metin Yaz veya Yapıştır":
     input_text = st.text_area('Metin Yaz veya Yapıştır', '', height=128)
 @st.cache_resource
 def load_pipeline(model_name, task_type):
         tokenizer = AutoTokenizer.from_pretrained(model_name)
         return pipeline('sentiment-analysis', model=model, tokenizer=tokenizer)
     elif task_type == "Metin Oluşturma":
+        model = AutoModelForCausalLM.from_pretrained(model_name)
         tokenizer = AutoTokenizer.from_pretrained(model_name)
         return pipeline('text-generation', model=model, tokenizer=tokenizer)
 # Görev ve modele göre pipeline yükleme
 model_dict = {
     "Metin Sınıflandırma": "nlptown/bert-base-multilingual-uncased-sentiment",
+    "Metin Analizi": "dbmdz/bert-base-turkish-cased",  # Türkçe model
     "Duygu Analizi": "cardiffnlp/twitter-roberta-base-sentiment",
+    "Metin Oluşturma": "gpt2",
+    "Varlık Tanıma": "dbmdz/bert-base-turkish-cased"  # Türkçe NER model
 }
 pipeline_model = load_pipeline(model_dict[task], task)
         output = pipeline_model(input_text, max_length=100, num_return_sequences=1)
         st.subheader("Oluşturulan Metin")
         st.write(output[0]['generated_text'])
+    elif task == "Varlık Tanıma":
+        output = pipeline_model(input_text)
+        entities = []
+        for item in output:
+            entities.append({
+                'Label': item['entity'],
+                'Score': item['score'],
+                'Word': item['word'],
+                'Start': item['start'],
+                'End': item['end']
+            })
+        df = pd.DataFrame(entities)
+        st.subheader("Varlık Tanıma Sonuçları")
+        st.dataframe(df)
+        # Metni formatla
+        def format_text(text_data):
+            formatted_text = ""
+            last_end = 0
+            for item in text_data:
+                if item['Start'] > last_end:
+                    formatted_text += input_text[last_end:item['Start']]
+                word = item['Word']
+                label = item['Label']
+                if label.startswith('I-'):
+                    color = 'blue'
+                elif label.startswith('B-'):
+                    color = 'green'
+                else:
+                    color = 'gray'
+                formatted_text += f"<span style='color:{color};'>{word}</span>"
+                last_end = item['End']
+            if last_end < len(input_text):
+                formatted_text += input_text[last_end:]
+            return formatted_text
+        formatted_text = format_text(entities)
+        st.subheader("Analiz Edilen Metin")
+        st.markdown(f"<p>{formatted_text}</p>", unsafe_allow_html=True)