mayf commited on
Commit
1d35b1e
·
verified ·
1 Parent(s): 4b3b42f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +27 -8
app.py CHANGED
@@ -30,9 +30,17 @@ def load_sentiment_pipeline():
30
  def load_keybert_model():
31
  return KeyBERT(model="all-MiniLM-L6-v2")
32
 
33
- # ─── BlenderBot Response Pipeline ───────────────────────────────────────────
34
  @st.cache_resource
35
- def load_response_pipeline():
 
 
 
 
 
 
 
 
36
  # Use BlenderBot 400M Distill for text generation
37
  return pipeline(
38
  "text2text-generation",
@@ -100,22 +108,33 @@ def main():
100
  st.markdown(f"**Highest Sentiment:** **{max_label}** ({max_score:.4f})")
101
  # ────────────────────────────────────────────────────────────────────
102
 
103
- # Generate appropriate reply
104
- response_pipeline = load_response_pipeline()
105
  if max_label in ["Positive", "Very Positive"]:
106
- prompt = (
107
  f"You are a friendly customer success representative. The customer said: \"{review}\". "
108
  "Write two sentences to express gratitude and highlight their positive experience."
109
  )
110
  else:
111
- prompt = (
112
  f"You are a helpful customer support specialist. The customer said: \"{review}\". "
113
  f"Identified issues: {', '.join([kw for kw, _ in keywords])}. "
114
  "First, ask 1-2 clarifying questions to understand their situation. "
115
  "Then provide two concrete suggestions or next steps to address these issues."
116
  )
117
- result = response_pipeline(prompt)
118
- reply = result[0]['generated_text'].strip()
 
 
 
 
 
 
 
 
 
 
 
119
 
120
  st.subheader("Generated Reply")
121
  st.write(reply)
 
30
  def load_keybert_model():
31
  return KeyBERT(model="all-MiniLM-L6-v2")
32
 
33
# ─── BlenderBot Response Components ─────────────────────────────────────────
@st.cache_resource
def load_response_components():
    """Load and cache the BlenderBot tokenizer and seq2seq model.

    The tokenizer and model are loaded directly (rather than through a
    `pipeline`) so the caller can tokenize with explicit truncation and avoid
    out-of-range position embeddings on long prompts.

    Returns:
        tuple: ``(tokenizer, model)`` for ``facebook/blenderbot-400M-distill``.
    """
    tok = AutoTokenizer.from_pretrained(
        "facebook/blenderbot-400M-distill",
        use_fast=True,
    )
    mdl = AutoModelForSeq2SeqLM.from_pretrained("facebook/blenderbot-400M-distill")
    return tok, mdl
    # NOTE(review): the committed version left an orphan ":" line and the old
    # `return pipeline("text2text-generation", ...)` body dangling after the
    # return above — unreachable residue from the replaced
    # load_response_pipeline(); removed here.
 
108
  st.markdown(f"**Highest Sentiment:** **{max_label}** ({max_score:.4f})")
109
  # ────────────────────────────────────────────────────────────────────
110
 
111
+ # Generate appropriate reply using manual tokenization & generation
112
+ tok, mdl = load_response_components()
113
  if max_label in ["Positive", "Very Positive"]:
114
+ prompt_text = (
115
  f"You are a friendly customer success representative. The customer said: \"{review}\". "
116
  "Write two sentences to express gratitude and highlight their positive experience."
117
  )
118
  else:
119
+ prompt_text = (
120
  f"You are a helpful customer support specialist. The customer said: \"{review}\". "
121
  f"Identified issues: {', '.join([kw for kw, _ in keywords])}. "
122
  "First, ask 1-2 clarifying questions to understand their situation. "
123
  "Then provide two concrete suggestions or next steps to address these issues."
124
  )
125
+ # Tokenize with truncation to avoid out-of-range embeddings
126
+ inputs = tok(
127
+ prompt_text,
128
+ return_tensors="pt",
129
+ truncation=True,
130
+ max_length=tok.model_max_length
131
+ )
132
+ outputs = mdl.generate(
133
+ **inputs,
134
+ max_new_tokens=150,
135
+ do_sample=False
136
+ )
137
+ reply = tok.decode(outputs[0], skip_special_tokens=True).strip()
138
 
139
  st.subheader("Generated Reply")
140
  st.write(reply)