Spaces:
Configuration error
Configuration error
| package jina | |
| import ( | |
| "github.com/mudler/LocalAI/core/backend" | |
| "github.com/mudler/LocalAI/core/config" | |
| "github.com/gofiber/fiber/v2" | |
| fiberContext "github.com/mudler/LocalAI/core/http/ctx" | |
| "github.com/mudler/LocalAI/core/schema" | |
| "github.com/mudler/LocalAI/pkg/grpc/proto" | |
| "github.com/mudler/LocalAI/pkg/model" | |
| "github.com/rs/zerolog/log" | |
| ) | |
| // JINARerankEndpoint acts like the Jina reranker endpoint (https://jina.ai/reranker/) | |
| // @Summary Reranks a list of phrases by relevance to a given text query. | |
| // @Param request body schema.JINARerankRequest true "query params" | |
| // @Success 200 {object} schema.JINARerankResponse "Response" | |
| // @Router /v1/rerank [post] | |
| func JINARerankEndpoint(cl *config.BackendConfigLoader, ml *model.ModelLoader, appConfig *config.ApplicationConfig) func(c *fiber.Ctx) error { | |
| return func(c *fiber.Ctx) error { | |
| req := new(schema.JINARerankRequest) | |
| if err := c.BodyParser(req); err != nil { | |
| return c.Status(fiber.StatusBadRequest).JSON(fiber.Map{ | |
| "error": "Cannot parse JSON", | |
| }) | |
| } | |
| input := new(schema.TTSRequest) | |
| // Get input data from the request body | |
| if err := c.BodyParser(input); err != nil { | |
| return err | |
| } | |
| modelFile, err := fiberContext.ModelFromContext(c, cl, ml, input.Model, false) | |
| if err != nil { | |
| modelFile = input.Model | |
| log.Warn().Msgf("Model not found in context: %s", input.Model) | |
| } | |
| cfg, err := cl.LoadBackendConfigFileByName(modelFile, appConfig.ModelPath, | |
| config.LoadOptionDebug(appConfig.Debug), | |
| config.LoadOptionThreads(appConfig.Threads), | |
| config.LoadOptionContextSize(appConfig.ContextSize), | |
| config.LoadOptionF16(appConfig.F16), | |
| ) | |
| if err != nil { | |
| modelFile = input.Model | |
| log.Warn().Msgf("Model not found in context: %s", input.Model) | |
| } else { | |
| modelFile = cfg.Model | |
| } | |
| log.Debug().Msgf("Request for model: %s", modelFile) | |
| if input.Backend != "" { | |
| cfg.Backend = input.Backend | |
| } | |
| request := &proto.RerankRequest{ | |
| Query: req.Query, | |
| TopN: int32(req.TopN), | |
| Documents: req.Documents, | |
| } | |
| results, err := backend.Rerank(modelFile, request, ml, appConfig, *cfg) | |
| if err != nil { | |
| return err | |
| } | |
| response := &schema.JINARerankResponse{ | |
| Model: req.Model, | |
| } | |
| for _, r := range results.Results { | |
| response.Results = append(response.Results, schema.JINADocumentResult{ | |
| Index: int(r.Index), | |
| Document: schema.JINAText{Text: r.Text}, | |
| RelevanceScore: float64(r.RelevanceScore), | |
| }) | |
| } | |
| response.Usage.TotalTokens = int(results.Usage.TotalTokens) | |
| response.Usage.PromptTokens = int(results.Usage.PromptTokens) | |
| return c.Status(fiber.StatusOK).JSON(response) | |
| } | |
| } | |