File size: 9,530 Bytes
381d345
 
 
 
 
3f3cdfd
40c87d6
fec555d
381d345
 
 
 
 
 
 
 
 
 
b63ba8d
381d345
d47936e
381d345
 
 
 
3f3cdfd
 
5514c6a
381d345
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
589c428
381d345
 
b63ba8d
7e61071
 
 
 
 
 
381d345
b8e584a
381d345
 
 
 
 
 
 
 
 
 
0b65cb8
381d345
 
0b65cb8
381d345
 
 
 
 
0b65cb8
381d345
 
 
 
 
 
dde279d
381d345
c2431bf
381d345
 
 
0b65cb8
381d345
 
 
 
 
 
 
 
0b65cb8
381d345
 
0b65cb8
381d345
 
0b65cb8
cb310c2
381d345
 
0b65cb8
381d345
1fe1d3e
 
381d345
 
 
 
1fe1d3e
 
381d345
1fe1d3e
381d345
1fe1d3e
 
0b65cb8
1fe1d3e
3f3cdfd
1fe1d3e
0b65cb8
1fe1d3e
 
51edae9
cb310c2
51edae9
0b65cb8
cb310c2
0eb0c17
0b65cb8
 
1fe1d3e
381d345
 
 
 
 
0b65cb8
381d345
 
b8e584a
381d345
 
 
 
 
 
 
 
 
 
b8e584a
381d345
fec555d
5514c6a
381d345
 
 
 
 
5514c6a
381d345
 
 
 
 
 
dde279d
381d345
c2431bf
381d345
 
 
5514c6a
381d345
 
 
 
 
 
 
 
5514c6a
381d345
cfe381f
5514c6a
381d345
 
06ff1c4
 
381d345
 
5514c6a
3f3cdfd
 
 
8cd6e35
381d345
 
 
 
5514c6a
381d345
b63ba8d
381d345
 
 
 
 
 
 
 
8cd6e35
3f3cdfd
 
 
381d345
 
 
 
 
 
 
 
 
 
 
 
 
65e5192
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
from datetime import datetime
import json
import uuid
import asyncio
import random
import os
from typing import Any, Dict, Optional

import httpx
from fastapi import HTTPException
from api.config import (
    MODEL_MAPPING,
    get_headers_api_chat,
    BASE_URL,
    AGENT_MODE,
    TRENDING_AGENT_MODE,
    MODEL_PREFIXES,
)
from api.models import ChatRequest
from api.logger import setup_logger
from api.validate import getHid

# Module-level logger created through the project's logging helper.
logger = setup_logger(__name__)

# Text that is removed from upstream responses wherever it appears.
BLOCKED_MESSAGE = "Generated by BLACKBOX.AI, try unlimited chat https://www.blackbox.ai"
# Optional text appended to every reply; read from the ADVERTISEMENT_TEXT
# environment variable and empty (i.e. nothing is appended) when unset.
ADVERTISEMENT_TEXT = os.getenv("ADVERTISEMENT_TEXT", "")

def create_chat_completion_data(content: str, model: str, timestamp: int, finish_reason: Optional[str] = None) -> Dict[str, Any]:
    """Build one ``chat.completion.chunk`` payload for a streamed reply.

    Args:
        content: Text placed in the chunk's ``delta``.
        model: Model name echoed back in the payload.
        timestamp: Value stored under ``created``.
        finish_reason: Stored on the single choice; ``None`` by default.

    Returns:
        A dict carrying a fresh random ``chatcmpl-<uuid4>`` id, exactly one
        choice at index 0 with the assistant delta, and ``usage`` set to
        ``None``.
    """
    delta = {"content": content, "role": "assistant"}
    choice = {"index": 0, "delta": delta, "finish_reason": finish_reason}
    chunk_id = f"chatcmpl-{uuid.uuid4()}"
    return {
        "id": chunk_id,
        "object": "chat.completion.chunk",
        "created": timestamp,
        "model": model,
        "choices": [choice],
        "usage": None,
    }

def message_to_dict(message, model_prefix: Optional[str] = None):
    """Convert a chat message object into a ``{"role", "content"}`` dict.

    ``message.content`` may be a plain string or a list of content-part
    dicts. For a list, the ``"text"`` value of every part that carries a
    string ``"text"`` is kept and the pieces are joined with newlines; parts
    without text are skipped. An empty list or ``None`` yields an empty
    string instead of raising.

    Args:
        message: Object exposing ``role`` and ``content`` attributes.
        model_prefix: When truthy, prepended to the content followed by a
            single space.

    Returns:
        A dict with the message's ``role`` and the flattened ``content``.
    """
    raw = message.content
    if isinstance(raw, str):
        content = raw
    else:
        # Indexing only the first part would fail on an empty list or on a
        # leading non-text part and would drop any later text parts.
        content = "\n".join(
            part["text"]
            for part in (raw or ())
            if isinstance(part, dict) and isinstance(part.get("text"), str)
        )
    if model_prefix:
        content = f"{model_prefix} {content}"
    return {"role": message.role, "content": content}

def strip_model_prefix(content: str, model_prefix: Optional[str] = None) -> str:
    """Drop a leading ``model_prefix`` from ``content`` when it is present.

    When the prefix is falsy or ``content`` does not start with it, the text
    is returned unchanged. Otherwise the prefix is cut off and surrounding
    whitespace is stripped from what remains.
    """
    if not model_prefix or not content.startswith(model_prefix):
        return content
    logger.debug(f"Stripping prefix '{model_prefix}' from content.")
    remainder = content[len(model_prefix):]
    return remainder.strip()

# Process streaming response with headers from config.py
async def process_streaming_response(request: ChatRequest):
    """Stream an upstream chat reply as server-sent-event lines.

    Async generator. Posts the request to ``{BASE_URL}/api/chat`` and, for
    every non-empty text chunk received, yields one ``data: <json>`` line
    (followed by a blank line) holding a ``chat.completion.chunk`` payload.
    After the upstream stream ends it yields an optional advertisement chunk
    (when ``ADVERTISEMENT_TEXT`` is set), a final chunk with
    ``finish_reason`` ``"stop"``, and ``data: [DONE]``.

    Args:
        request: Incoming chat request; ``model``, ``messages``,
            ``max_tokens``, ``temperature`` and ``top_p`` are read from it.

    Raises:
        HTTPException: 500 when ``getHid()`` returns a falsy value; the
            upstream status code on ``httpx.HTTPStatusError``; 500 on
            ``httpx.RequestError``.
    """
    request_id = f"chatcmpl-{uuid.uuid4()}"
    logger.info(f"Processing request with ID: {request_id} - Model: {request.model}")

    agent_mode = AGENT_MODE.get(request.model, {})
    trending_agent_mode = TRENDING_AGENT_MODE.get(request.model, {})
    model_prefix = MODEL_PREFIXES.get(request.model, "")

    headers_api_chat = get_headers_api_chat(BASE_URL)

    # Delay for 'o1-preview' model if necessary
    if request.model == 'o1-preview':
        delay_seconds = random.randint(1, 60)
        logger.info(f"Introducing a delay of {delay_seconds} seconds for model 'o1-preview' (Request ID: {request_id})")
        await asyncio.sleep(delay_seconds)

    # The upstream payload carries this value under "validated"; without it
    # the request is not attempted.
    h_value = await getHid()
    if not h_value:
        logger.error("Failed to retrieve h-value for validation.")
        raise HTTPException(status_code=500, detail="Validation failed due to missing h-value.")

    json_data = {
        "agentMode": agent_mode,
        "clickedAnswer2": False,
        "clickedAnswer3": False,
        "clickedForceWebSearch": False,
        "codeModelMode": True,
        "githubToken": None,
        "id": None,
        "isChromeExt": False,
        "isMicMode": False,
        "maxTokens": request.max_tokens,
        "messages": [message_to_dict(msg, model_prefix=model_prefix) for msg in request.messages],
        "mobileClient": False,
        "playgroundTemperature": request.temperature,
        "playgroundTopP": request.top_p,
        "previewToken": None,
        "trendingAgentMode": trending_agent_mode,
        "userId": None,
        "userSelectedModel": MODEL_MAPPING.get(request.model, request.model),
        "userSystemPrompt": None,
        "validated": h_value,
        "visitFromDelta": False,
        "webSearchModePrompt": False,
        "imageGenerationMode": False,
    }

    # NOTE(review): presumably this generator feeds a streaming HTTP
    # response; if so, an HTTPException raised after the first chunk was sent
    # can no longer change the status code - confirm against the caller.
    async with httpx.AsyncClient() as client:
        try:
            async with client.stream("POST", f"{BASE_URL}/api/chat", headers=headers_api_chat, json=json_data, timeout=100) as response:
                response.raise_for_status()

                # One timestamp is shared by every chunk of this reply.
                timestamp = int(datetime.now().timestamp())
                async for chunk in response.aiter_text():
                    if chunk:
                        content = chunk
                        if content.startswith("$@$v=undefined-rv1$@$"):
                            content = content[21:]  # Remove unwanted prefix (21 == its length)

                        if BLOCKED_MESSAGE in content:
                            logger.info(f"Blocked message detected in response for Request ID {request_id}.")
                            content = content.replace(BLOCKED_MESSAGE, '').strip()

                        if not content:
                            continue  # Skip empty content

                        cleaned_content = strip_model_prefix(content, model_prefix)

                        # Yield cleaned chunk as part of the stream
                        yield f"data: {json.dumps(create_chat_completion_data(cleaned_content, request.model, timestamp))}\n\n"

                # Append markdown separator and advertisement as a separate chunk.
                # This point is reached at most once per call, so no extra
                # "already added" bookkeeping is needed.
                if ADVERTISEMENT_TEXT:
                    advertisement_with_line_break = "\n---\n" + ADVERTISEMENT_TEXT  # Add the markdown horizontal rule
                    yield f"data: {json.dumps(create_chat_completion_data(advertisement_with_line_break, request.model, timestamp))}\n\n"

                # Yield final chunk indicating the end of the stream
                yield f"data: {json.dumps(create_chat_completion_data('', request.model, timestamp, 'stop'))}\n\n"
                yield "data: [DONE]\n\n"

        except httpx.HTTPStatusError as e:
            logger.error(f"HTTP error occurred for Request ID {request_id}: {e}")
            raise HTTPException(status_code=e.response.status_code, detail=str(e)) from e
        except httpx.RequestError as e:
            logger.error(f"Request error occurred for Request ID {request_id}: {e}")
            raise HTTPException(status_code=500, detail=str(e)) from e

# Process non-streaming response with headers from config.py
async def process_non_streaming_response(request: ChatRequest):
    """Fetch a complete upstream chat reply and return it as one completion.

    Posts the request to ``{BASE_URL}/api/chat``, collects the whole response
    body, removes the ``$@$v=undefined-rv1$@$`` marker, ``BLOCKED_MESSAGE``
    and the model prefix, then appends ``ADVERTISEMENT_TEXT`` when it is set.

    Args:
        request: Incoming chat request; ``model``, ``messages``,
            ``max_tokens``, ``temperature`` and ``top_p`` are read from it.

    Returns:
        A ``chat.completion`` dict with a single assistant message whose
        ``finish_reason`` is ``"stop"`` and whose ``usage`` is ``None``.

    Raises:
        HTTPException: 500 when ``getHid()`` returns a falsy value; the
            upstream status code on ``httpx.HTTPStatusError``; 500 on
            ``httpx.RequestError``.
    """
    request_id = f"chatcmpl-{uuid.uuid4()}"
    logger.info(f"Processing request with ID: {request_id} - Model: {request.model}")

    agent_mode = AGENT_MODE.get(request.model, {})
    trending_agent_mode = TRENDING_AGENT_MODE.get(request.model, {})
    model_prefix = MODEL_PREFIXES.get(request.model, "")

    headers_api_chat = get_headers_api_chat(BASE_URL)

    # Delay for 'o1-preview' model if necessary
    if request.model == 'o1-preview':
        delay_seconds = random.randint(20, 60)
        logger.info(f"Introducing a delay of {delay_seconds} seconds for model 'o1-preview' (Request ID: {request_id})")
        await asyncio.sleep(delay_seconds)

    # The upstream payload carries this value under "validated"; without it
    # the request is not attempted.
    h_value = await getHid()
    if not h_value:
        logger.error("Failed to retrieve h-value for validation.")
        raise HTTPException(status_code=500, detail="Validation failed due to missing h-value.")

    json_data = {
        "agentMode": agent_mode,
        "clickedAnswer2": False,
        "clickedAnswer3": False,
        "clickedForceWebSearch": False,
        "codeModelMode": True,
        "githubToken": None,
        "id": None,
        "isChromeExt": False,
        "isMicMode": False,
        "maxTokens": request.max_tokens,
        "messages": [message_to_dict(msg, model_prefix=model_prefix) for msg in request.messages],
        "mobileClient": False,
        "playgroundTemperature": request.temperature,
        "playgroundTopP": request.top_p,
        "previewToken": None,
        "trendingAgentMode": trending_agent_mode,
        "userId": None,
        "userSelectedModel": MODEL_MAPPING.get(request.model, request.model),
        "userSystemPrompt": None,
        "validated": h_value,
        "visitFromDelta": False,
        "webSearchModePrompt": False,
        "imageGenerationMode": False,
    }

    chunks = []  # Pieces of the upstream body, joined once after the read loop

    async with httpx.AsyncClient() as client:
        try:
            # Same 100 s timeout as the streaming variant; without it httpx
            # falls back to its short default and slow generations are cut off.
            async with client.stream("POST", f"{BASE_URL}/api/chat", headers=headers_api_chat, json=json_data, timeout=100) as response:
                response.raise_for_status()
                async for chunk in response.aiter_text():
                    chunks.append(chunk)

        except httpx.HTTPStatusError as e:
            logger.error(f"HTTP error occurred for Request ID {request_id}: {e}")
            raise HTTPException(status_code=e.response.status_code, detail=str(e)) from e
        except httpx.RequestError as e:
            logger.error(f"Request error occurred for Request ID {request_id}: {e}")
            raise HTTPException(status_code=500, detail=str(e)) from e

    full_response = "".join(chunks)

    if full_response.startswith("$@$v=undefined-rv1$@$"):
        full_response = full_response[21:]  # 21 == length of the marker

    if BLOCKED_MESSAGE in full_response:
        full_response = full_response.replace(BLOCKED_MESSAGE, '').strip()

    cleaned_full_response = strip_model_prefix(full_response, model_prefix)

    # Append advertisement once
    if ADVERTISEMENT_TEXT:
        cleaned_full_response += "\n\n" + ADVERTISEMENT_TEXT

    return {
        "id": f"chatcmpl-{uuid.uuid4()}",
        "object": "chat.completion",
        "created": int(datetime.now().timestamp()),
        "model": request.model,
        "choices": [
            {
                "index": 0,
                "message": {"role": "assistant", "content": cleaned_full_response},
                "finish_reason": "stop",
            }
        ],
        "usage": None,
    }