|
package jina |
|
|
|
import ( |
|
"github.com/mudler/LocalAI/core/backend" |
|
"github.com/mudler/LocalAI/core/config" |
|
|
|
"github.com/gofiber/fiber/v2" |
|
fiberContext "github.com/mudler/LocalAI/core/http/ctx" |
|
"github.com/mudler/LocalAI/core/schema" |
|
"github.com/mudler/LocalAI/pkg/grpc/proto" |
|
"github.com/mudler/LocalAI/pkg/model" |
|
"github.com/rs/zerolog/log" |
|
) |
|
|
|
|
|
|
|
|
|
|
|
|
|
func JINARerankEndpoint(cl *config.BackendConfigLoader, ml *model.ModelLoader, appConfig *config.ApplicationConfig) func(c *fiber.Ctx) error { |
|
return func(c *fiber.Ctx) error { |
|
req := new(schema.JINARerankRequest) |
|
if err := c.BodyParser(req); err != nil { |
|
return c.Status(fiber.StatusBadRequest).JSON(fiber.Map{ |
|
"error": "Cannot parse JSON", |
|
}) |
|
} |
|
|
|
input := new(schema.TTSRequest) |
|
|
|
|
|
if err := c.BodyParser(input); err != nil { |
|
return err |
|
} |
|
|
|
modelFile, err := fiberContext.ModelFromContext(c, cl, ml, input.Model, false) |
|
if err != nil { |
|
modelFile = input.Model |
|
log.Warn().Msgf("Model not found in context: %s", input.Model) |
|
} |
|
|
|
cfg, err := cl.LoadBackendConfigFileByName(modelFile, appConfig.ModelPath, |
|
config.LoadOptionDebug(appConfig.Debug), |
|
config.LoadOptionThreads(appConfig.Threads), |
|
config.LoadOptionContextSize(appConfig.ContextSize), |
|
config.LoadOptionF16(appConfig.F16), |
|
) |
|
|
|
if err != nil { |
|
modelFile = input.Model |
|
log.Warn().Msgf("Model not found in context: %s", input.Model) |
|
} else { |
|
modelFile = cfg.Model |
|
} |
|
log.Debug().Msgf("Request for model: %s", modelFile) |
|
|
|
if input.Backend != "" { |
|
cfg.Backend = input.Backend |
|
} |
|
|
|
request := &proto.RerankRequest{ |
|
Query: req.Query, |
|
TopN: int32(req.TopN), |
|
Documents: req.Documents, |
|
} |
|
|
|
results, err := backend.Rerank(cfg.Backend, modelFile, request, ml, appConfig, *cfg) |
|
if err != nil { |
|
return err |
|
} |
|
|
|
response := &schema.JINARerankResponse{ |
|
Model: req.Model, |
|
} |
|
|
|
for _, r := range results.Results { |
|
response.Results = append(response.Results, schema.JINADocumentResult{ |
|
Index: int(r.Index), |
|
Document: schema.JINAText{Text: r.Text}, |
|
RelevanceScore: float64(r.RelevanceScore), |
|
}) |
|
} |
|
|
|
response.Usage.TotalTokens = int(results.Usage.TotalTokens) |
|
response.Usage.PromptTokens = int(results.Usage.PromptTokens) |
|
|
|
return c.Status(fiber.StatusOK).JSON(response) |
|
} |
|
} |
|
|