Ahmed235 committed
Commit 18332e8 · verified · 1 Parent(s): 1a023c5

Update app.py

Files changed (1)
  1. app.py +7 -24
app.py CHANGED
@@ -1,15 +1,8 @@
 import gradio as gr
-from transformers import AutoTokenizer, AutoModelForSequenceClassification
-import torch
-import torch.nn.functional as F
-from pptx import Presentation
-import re
+from transformers import pipeline

-# Load the pre-trained model and tokenizer using gr.load
-model = gr.load("models/Ahmed235/roberta_classification")
-
-# Tokenizer can be loaded using transformers directly
-tokenizer = AutoTokenizer.from_pretrained("Ahmed235/roberta_classification")
+# Create a text classification pipeline
+classifier = pipeline("text-classification", model="Ahmed235/roberta_classification", tokenizer="Ahmed235/roberta_classification")

 def extract_text_from_pptx(file_path):
     presentation = Presentation(file_path)
@@ -23,22 +16,12 @@ def extract_text_from_pptx(file_path):
 def predict_pptx_content(file_path):
     try:
         extracted_text = extract_text_from_pptx(file_path)
-        cleaned_text = re.sub(r'\s+', ' ', extracted_text)
-
-        # Tokenize and encode the cleaned text
-        input_encoding = tokenizer(cleaned_text, truncation=True, padding=True, return_tensors="pt")
-        input_encoding = {key: val.to(device) for key, val in input_encoding.items()}  # Move input tensor to CPU
-
-        # Perform inference
-        with torch.no_grad():
-            outputs = model(**input_encoding)
-            logits = outputs.logits

-        probabilities = F.softmax(logits, dim=1)
+        # Perform inference using the pipeline
+        result = classifier(extracted_text)

-        predicted_label_id = torch.argmax(logits, dim=1).item()
-        predicted_label = model.config.id2label[predicted_label_id]
-        predicted_probability = probabilities[0][predicted_label_id].item()
+        predicted_label = result[0]['label']
+        predicted_probability = result[0]['score']

         prediction = {
             "Predicted Label": predicted_label,