Spaces:

tahirsher
/

Cooking_Receips

Sleeping

tahirsher committed on Oct 17, 2024

Commit

2c7d942

verified ·

1 Parent(s): d8997e3

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,22 +1,24 @@
 import streamlit as st
 from transformers import pipeline
 # Initialize the text generation pipeline with the GPT-2 fine-tuned recipe model
 pipe = pipeline("text-generation", model="mrm8488/gpt2-finetuned-recipes-cooking_v2")
 def clean_recipe(text):
-    # Split the generated text into sentences using both "." and other common delimiters
-    steps = text.replace("\n", " ").split('.')
-    # Remove any extra spaces and filter out empty or repetitive steps
     cleaned_steps = []
     seen_steps = set()  # Track steps to avoid repetition
     for step in steps:
         step = step.strip()  # Remove leading/trailing spaces
-        if step and step.lower() not in seen_steps:  # Skip empty or repetitive steps
             cleaned_steps.append(step)
-            seen_steps.add(step.lower())  # Add step to the seen set
     return cleaned_steps

 import streamlit as st
 from transformers import pipeline
+import re
 # Initialize the text generation pipeline with the GPT-2 fine-tuned recipe model
 pipe = pipeline("text-generation", model="mrm8488/gpt2-finetuned-recipes-cooking_v2")
 def clean_recipe(text):
+    # Split text into sentences based on periods, question marks, or exclamation points
+    steps = re.split(r'(?<=[.!?])\s+', text)
+    # Remove any irrelevant or overly technical information by filtering based on length and content
     cleaned_steps = []
     seen_steps = set()  # Track steps to avoid repetition
     for step in steps:
         step = step.strip()  # Remove leading/trailing spaces
+        # Skip irrelevant or short steps and avoid repetitions
+        if len(step) > 20 and step.lower() not in seen_steps:
             cleaned_steps.append(step)
+            seen_steps.add(step.lower())  # Track unique steps
     return cleaned_steps