File size: 1,196 Bytes
8746c2a
 
 
 
 
 
 
 
 
 
 
 
 
ef69607
 
8746c2a
 
 
 
 
 
 
 
2ff8862
 
8746c2a
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
from typing import Any, List

from openai import AsyncAzureOpenAI, AzureOpenAI

from ...utils.registry import registry
from .base import EncoderBase


@registry.register_encoder()
class AzureTextEmbeddingV3(EncoderBase):
    model_id: str = "text-embedding-3-large"
    api_key: str
    dim: int = 3072
    api_version: str
    
    class Config:
        """Configuration for this pydantic object."""

        protected_namespaces = ()
        extra = "allow"

    def __init__(self, /, **data: Any) -> None:
        super().__init__(**data)
        self.client = AzureOpenAI(azure_endpoint=self.endpoint, api_key=self.api_key, api_version=self.api_version)
        self.aclient = AsyncAzureOpenAI(azure_endpoint=self.endpoint, api_key=self.api_key, api_version=self.api_version)

    def _infer(self, data: List[str], **kwargs) -> List[List[float]]:
        res = self.client.embeddings.create(input=data, model=self.model_id)
        return [item.embedding for item in res.data]

    async def _ainfer(self, data: List[str], **kwargs) -> List[List[float]]:
        res = await self.aclient.embeddings.create(input=data, model=self.model_id)
        return [item.embedding for item in res.data]