Spaces:
Build error
Build error
Update app.py
Browse files
app.py
CHANGED
@@ -5,20 +5,20 @@ from concurrent.futures import ThreadPoolExecutor, as_completed
|
|
5 |
import uvicorn
|
6 |
import re
|
7 |
from dotenv import load_dotenv
|
8 |
-
|
9 |
from spaces import ZeroGPU
|
10 |
|
11 |
load_dotenv()
|
12 |
|
13 |
-
|
|
|
|
|
14 |
try:
|
15 |
ZeroGPU.initialize()
|
16 |
except Exception as e:
|
17 |
print(f"ZeroGPU initialization failed: {e}")
|
18 |
|
19 |
-
|
20 |
-
|
21 |
-
# Global data dictionary
|
22 |
global_data = {
|
23 |
'models': {},
|
24 |
'tokens': {
|
@@ -107,25 +107,17 @@ def remove_duplicates(text):
|
|
107 |
seen_lines = set()
|
108 |
for line in lines:
|
109 |
if line not in seen_lines:
|
110 |
-
seen_lines.add(line)
|
111 |
unique_lines.append(line)
|
|
|
112 |
return '\n'.join(unique_lines)
|
113 |
|
114 |
-
|
115 |
-
seen = set()
|
116 |
-
unique_responses = []
|
117 |
-
for response in responses:
|
118 |
-
normalized_response = remove_duplicates(response['response'])
|
119 |
-
if normalized_response not in seen:
|
120 |
-
seen.add(normalized_response)
|
121 |
-
unique_responses.append({'model': response['model'], 'response': normalized_response})
|
122 |
-
return unique_responses
|
123 |
-
|
124 |
def generate_model_response(model, inputs, top_k, top_p, temperature):
|
125 |
try:
|
126 |
-
|
|
|
127 |
except Exception as e:
|
128 |
-
print(f"Error generating
|
129 |
return ""
|
130 |
|
131 |
@app.post("/generate")
|
@@ -152,5 +144,12 @@ async def process_request(request: Request, call_next):
|
|
152 |
print(f"Request error: {e}")
|
153 |
raise HTTPException(status_code=500, detail="Internal Server Error")
|
154 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
155 |
if __name__ == "__main__":
|
156 |
uvicorn.run(app, host="0.0.0.0", port=8000)
|
|
|
5 |
import uvicorn
|
6 |
import re
|
7 |
from dotenv import load_dotenv
|
8 |
+
import gradio as gr
|
9 |
from spaces import ZeroGPU
|
10 |
|
11 |
load_dotenv()
|
12 |
|
13 |
+
app = FastAPI()
|
14 |
+
|
15 |
+
# Initialize ZeroGPU
|
16 |
try:
|
17 |
ZeroGPU.initialize()
|
18 |
except Exception as e:
|
19 |
print(f"ZeroGPU initialization failed: {e}")
|
20 |
|
21 |
+
# Global dictionary for storing models and tokens
|
|
|
|
|
22 |
global_data = {
|
23 |
'models': {},
|
24 |
'tokens': {
|
|
|
107 |
seen_lines = set()
|
108 |
for line in lines:
|
109 |
if line not in seen_lines:
|
|
|
110 |
unique_lines.append(line)
|
111 |
+
seen_lines.add(line)
|
112 |
return '\n'.join(unique_lines)
|
113 |
|
114 |
+
# NOTE(review): the visible imports only show `from spaces import ZeroGPU`;
# confirm that the `spaces` module name itself is bound before this decorator runs.
@spaces.GPU(duration=0)
def generate_model_response(model, inputs, top_k, top_p, temperature):
    """Run ``model.generate`` and pass its result through ``remove_duplicates``.

    Args:
        model: Object exposing a ``generate`` method that accepts ``inputs``
            positionally plus ``top_k``, ``top_p`` and ``temperature``
            keyword arguments.
        inputs: Forwarded unchanged as the first argument of ``model.generate``.
        top_k: Forwarded to ``model.generate`` as ``top_k``.
        top_p: Forwarded to ``model.generate`` as ``top_p``.
        temperature: Forwarded to ``model.generate`` as ``temperature``.

    Returns:
        Whatever ``remove_duplicates`` returns for the generated result, or
        an empty string if generation or de-duplication raises.
    """
    generation_kwargs = {
        'top_k': top_k,
        'top_p': top_p,
        'temperature': temperature,
    }
    try:
        # Both calls stay inside the try so a failure in either one is
        # logged and turned into the empty-string fallback.
        return remove_duplicates(model.generate(inputs, **generation_kwargs))
    except Exception as e:
        print(f"Error generating model response: {e}")
        return ""
|
122 |
|
123 |
@app.post("/generate")
|
|
|
144 |
print(f"Request error: {e}")
|
145 |
raise HTTPException(status_code=500, detail="Internal Server Error")
|
146 |
|
147 |
+
def remove_repetitive_responses(responses):
    """Keep only the first response seen for each model.

    Args:
        responses: Iterable of mappings, each read via its ``'model'`` and
            ``'response'`` keys.

    Returns:
        A dict mapping each ``'model'`` value to the ``'response'`` value of
        its first occurrence in ``responses``. Later entries for a model
        that is already present are ignored.
    """
    first_by_model = {}
    for entry in responses:
        model_key = entry['model']
        if model_key in first_by_model:
            # An earlier entry already claimed this model; keep that one.
            continue
        first_by_model[model_key] = entry['response']
    return first_by_model
|
153 |
+
|
154 |
if __name__ == "__main__":
|
155 |
uvicorn.run(app, host="0.0.0.0", port=8000)
|