Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -560,24 +560,25 @@ def chat_function(message, history, mode, progress=gr.Progress()):
|
|
560 |
|
561 |
try:
|
562 |
# Load model (this will run on GPU when GPU is allocated)
|
563 |
-
progress(0.05
|
564 |
tok, mod, dev = load_model()
|
565 |
|
566 |
# Create appropriate generator
|
567 |
if mode == "Quality (Slower, Better)":
|
568 |
generator = QualityGenerator(tok, mod, dev)
|
569 |
-
progress(0.1
|
570 |
else:
|
571 |
generator = SpeedGenerator(tok, mod, dev)
|
572 |
-
progress(0.1
|
573 |
|
574 |
# Generate response with progress callback
|
575 |
-
def progress_callback(pct,
|
576 |
-
progress(pct
|
|
|
577 |
|
578 |
response, stats = generator.generate(message, progress_callback)
|
579 |
|
580 |
-
progress(1.0
|
581 |
|
582 |
# Create performance info
|
583 |
perf_info = f"""**⚡ Performance Stats:**
|
|
|
560 |
|
561 |
try:
|
562 |
# Load model (this will run on GPU when GPU is allocated)
|
563 |
+
progress(0.05)
|
564 |
tok, mod, dev = load_model()
|
565 |
|
566 |
# Create appropriate generator
|
567 |
if mode == "Quality (Slower, Better)":
|
568 |
generator = QualityGenerator(tok, mod, dev)
|
569 |
+
progress(0.1)
|
570 |
else:
|
571 |
generator = SpeedGenerator(tok, mod, dev)
|
572 |
+
progress(0.1)
|
573 |
|
574 |
# Generate response with progress callback
|
575 |
+
def progress_callback(pct, status_msg):
|
576 |
+
progress(pct)
|
577 |
+
# We'll show status in the performance display instead
|
578 |
|
579 |
response, stats = generator.generate(message, progress_callback)
|
580 |
|
581 |
+
progress(1.0)
|
582 |
|
583 |
# Create performance info
|
584 |
perf_info = f"""**⚡ Performance Stats:**
|