Spaces:
Sleeping
Sleeping
Commit
·
1408e00
1
Parent(s):
1710631
updated app.py
Browse files
app.py
CHANGED
@@ -73,14 +73,36 @@ class ModelWrapper:
|
|
73 |
do_sample=True,
|
74 |
pad_token_id=self.tokenizer.pad_token_id,
|
75 |
eos_token_id=self.tokenizer.eos_token_id,
|
76 |
-
repetition_penalty=1.
|
|
|
|
|
|
|
77 |
)
|
78 |
|
79 |
# Decode response
|
80 |
response = self.tokenizer.decode(outputs[0], skip_special_tokens=True)
|
|
|
|
|
81 |
if response.startswith(prompt):
|
82 |
response = response[len(prompt):].strip()
|
83 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
84 |
generation_time = time.time() - start_time
|
85 |
return response, generation_time
|
86 |
except Exception as e:
|
|
|
73 |
do_sample=True,
|
74 |
pad_token_id=self.tokenizer.pad_token_id,
|
75 |
eos_token_id=self.tokenizer.eos_token_id,
|
76 |
+
repetition_penalty=1.2, # Increased to reduce repetition
|
77 |
+
no_repeat_ngram_size=3, # Prevent any 3-gram from appearing more than once
|
78 |
+
early_stopping=True, # Only affects beam-based decoding; stopping at EOS is governed by eos_token_id
|
79 |
+
stopping_criteria=None # Will use default stopping criteria
|
80 |
)
|
81 |
|
82 |
# Decode response
|
83 |
response = self.tokenizer.decode(outputs[0], skip_special_tokens=True)
|
84 |
+
|
85 |
+
# Clean up the response
|
86 |
if response.startswith(prompt):
|
87 |
response = response[len(prompt):].strip()
|
88 |
|
89 |
+
# Truncate the response at the first (case-insensitive) match of each sign-off or role-marker pattern
|
90 |
+
closures = [
|
91 |
+
"Best regards,",
|
92 |
+
"Sincerely,",
|
93 |
+
"Thanks,",
|
94 |
+
"Thank you,",
|
95 |
+
"Regards,",
|
96 |
+
"Assistant:",
|
97 |
+
"Human:",
|
98 |
+
"[Your Name]",
|
99 |
+
"[Student]"
|
100 |
+
]
|
101 |
+
|
102 |
+
for closure in closures:
|
103 |
+
if closure.lower() in response.lower():
|
104 |
+
response = response[:response.lower().find(closure.lower())].strip()
|
105 |
+
|
106 |
generation_time = time.time() - start_time
|
107 |
return response, generation_time
|
108 |
except Exception as e:
|