|
from __future__ import annotations |
|
|
|
import json |
|
import asyncio |
|
from aiohttp import ClientSession, ContentTypeError |
|
|
|
from ..typing import AsyncResult, Messages |
|
from .base_provider import AsyncGeneratorProvider, ProviderModelMixin |
|
from ..requests.aiohttp import get_connector |
|
from ..requests.raise_for_status import raise_for_status |
|
from .helper import format_prompt |
|
from ..image import ImageResponse |
|
|
|
class ReplicateHome(AsyncGeneratorProvider, ProviderModelMixin):
    """Provider that runs predictions through the replicate.com homepage API.

    A prediction is created with a POST to ``api_endpoint``; its result is
    then obtained by repeatedly GET-ing ``poll_endpoint`` with the returned
    prediction id until the prediction reports a terminal status.
    """

    url = "https://replicate.com"
    api_endpoint = "https://homepage.replicate.com/api/prediction"
    # Polled as "<poll_endpoint>?id=<prediction id>".
    poll_endpoint = "https://homepage.replicate.com/api/poll"
    working = True
    supports_stream = True
    supports_system_message = True
    supports_message_history = True

    default_model = 'yorickvp/llava-13b'

    image_models = [
        'stability-ai/stable-diffusion-3',
        'bytedance/sdxl-lightning-4step',
        'playgroundai/playground-v2.5-1024px-aesthetic',
    ]

    text_models = [
        'meta/meta-llama-3-70b-instruct',
        'mistralai/mixtral-8x7b-instruct-v0.1',
        'google-deepmind/gemma-2b-it',
        'yorickvp/llava-13b',
    ]

    models = text_models + image_models

    # Short alias -> full model identifier.
    model_aliases = {
        "sd-3": "stability-ai/stable-diffusion-3",
        "sdxl": "bytedance/sdxl-lightning-4step",
        "playground-v2.5": "playgroundai/playground-v2.5-1024px-aesthetic",
        "gemma-2b": "google-deepmind/gemma-2b-it",
        "llava-13b": "yorickvp/llava-13b",
    }

    # Full model identifier -> version hash sent in the prediction request.
    # NOTE(review): 'meta/meta-llama-3-70b-instruct' and
    # 'mistralai/mixtral-8x7b-instruct-v0.1' are listed in ``text_models`` but
    # have no entry here, so requesting them fails with a KeyError. Add their
    # version hashes or drop them from ``text_models``.
    model_versions = {
        'stability-ai/stable-diffusion-3': "527d2a6296facb8e47ba1eaf17f142c240c19a30894f437feee9b91cc29d8e4f",
        'bytedance/sdxl-lightning-4step': "5f24084160c9089501c1b3545d9be3c27883ae2239b6f412990e82d4a6210f8f",
        'playgroundai/playground-v2.5-1024px-aesthetic': "a45f82a1382bed5c7aeb861dac7c7d191b0fdf74d8d57c4a0e6ed7d4d0bf7d24",
        "google-deepmind/gemma-2b-it": "dff94eaf770e1fc211e425a50b51baa8e4cac6c39ef074681f9e39d778773626",
        "yorickvp/llava-13b": "80537f9eead1a5bfa72d5ac6ea6414379be41d4d4f6679fd776e9535d1eb58bb",
    }

    @staticmethod
    async def _read_json(response):
        """Decode the response body as JSON even if its content type is not JSON.

        Raises:
            ValueError: If the body is not valid JSON.
        """
        try:
            return await response.json()
        except ContentTypeError:
            # The content-type header did not announce JSON; parse the raw
            # text ourselves before giving up.
            text = await response.text()
            try:
                return json.loads(text)
            except json.JSONDecodeError as err:
                raise ValueError(f"Unexpected response format: {text}") from err

    @classmethod
    async def create_async_generator(
        cls,
        model: str,
        messages: Messages,
        prompt: str | None = None,
        proxy: str | None = None,
        max_attempts: int = 30,
        delay: float = 5,
        **kwargs
    ) -> AsyncResult:
        """Create a prediction and yield its output once it has succeeded.

        Args:
            model: Model name or alias, resolved through ``cls.get_model``.
            messages: Conversation used to build the prompt when ``prompt``
                is not given. Image models use the content of the last
                message; other models use ``format_prompt(messages)``.
            prompt: Explicit prompt; overrides ``messages`` when not ``None``.
            proxy: Proxy passed to ``get_connector``.
            max_attempts: Maximum number of poll requests before giving up.
            delay: Seconds to wait between two poll requests.
            **kwargs: Accepted for interface compatibility; unused here.

        Yields:
            For image models, a single ``ImageResponse`` built from the first
            output entry and the prompt. Otherwise, each chunk of the
            prediction output in order.

        Raises:
            KeyError: If no version hash is configured for the model.
            ValueError: If a poll response body is not valid JSON.
            Exception: If the prediction fails, is canceled, succeeds without
                image output, or does not finish within ``max_attempts`` polls.
        """
        model = cls.get_model(model)

        # Fail before any network traffic, with a message that names the
        # actual problem instead of a bare KeyError on the model string.
        try:
            version = cls.model_versions[model]
        except KeyError:
            raise KeyError(f"No version hash is configured for model {model!r}") from None

        if prompt is None:
            if model in cls.image_models:
                prompt = messages[-1]['content']
            else:
                prompt = format_prompt(messages)

        headers = {
            "accept": "*/*",
            "accept-language": "en-US,en;q=0.9",
            "cache-control": "no-cache",
            "content-type": "application/json",
            "origin": "https://replicate.com",
            "pragma": "no-cache",
            "priority": "u=1, i",
            "referer": "https://replicate.com/",
            "sec-ch-ua": '"Not;A=Brand";v="24", "Chromium";v="128"',
            "sec-ch-ua-mobile": "?0",
            "sec-ch-ua-platform": '"Linux"',
            "sec-fetch-dest": "empty",
            "sec-fetch-mode": "cors",
            "sec-fetch-site": "same-site",
            "user-agent": "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/128.0.0.0 Safari/537.36"
        }

        data = {
            "model": model,
            "version": version,
            "input": {"prompt": prompt},
        }

        async with ClientSession(headers=headers, connector=get_connector(proxy=proxy)) as session:
            async with session.post(cls.api_endpoint, json=data) as response:
                await raise_for_status(response)
                result = await response.json()
                prediction_id = result['id']

            poll_url = f"{cls.poll_endpoint}?id={prediction_id}"
            for attempt in range(max_attempts):
                async with session.get(poll_url) as response:
                    await raise_for_status(response)
                    result = await cls._read_json(response)

                status = result.get('status')
                if status == 'succeeded':
                    output = result.get('output')
                    if model in cls.image_models:
                        if not output:
                            raise Exception("Prediction succeeded but returned no output")
                        # Output is normally a list of URLs; a bare string is
                        # tolerated in case a model returns a single URL.
                        image_url = output if isinstance(output, str) else output[0]
                        yield ImageResponse(image_url, prompt)
                    elif isinstance(output, str):
                        yield output
                    else:
                        # A missing output yields nothing rather than crashing.
                        for chunk in output or []:
                            yield chunk
                    return

                # "canceled" is terminal too; polling it further would only
                # end in a misleading timeout.
                if status in ('failed', 'canceled'):
                    raise Exception(f"Prediction {status}: {result.get('error')}")

                # No point in waiting after the final attempt.
                if attempt < max_attempts - 1:
                    await asyncio.sleep(delay)

            raise Exception("Prediction timed out")
|
|