Spaces:
Running
Running
fahmiaziz98
committed on
Commit
·
a23b910
1
Parent(s):
155ad69
[TYPO] fix typo
Browse files
src/api/routers/embedding.py
CHANGED
|
@@ -105,8 +105,8 @@ async def create_embeddings_document(
|
|
| 105 |
)
|
| 106 |
|
| 107 |
logger.info(
|
| 108 |
-
f"Generated {len(request.
|
| 109 |
-
f"in {processing_time:.3f}s ({len(request.
|
| 110 |
)
|
| 111 |
|
| 112 |
return response
|
|
@@ -149,11 +149,11 @@ async def create_sparse_embedding(
|
|
| 149 |
HTTPException: On validation or generation errors
|
| 150 |
"""
|
| 151 |
try:
|
| 152 |
-
validate_texts(request.
|
| 153 |
kwargs = extract_embedding_kwargs(request)
|
| 154 |
|
| 155 |
-
model = manager.get_model(request.
|
| 156 |
-
config = manager.model_configs[request.
|
| 157 |
|
| 158 |
start_time = time.time()
|
| 159 |
|
|
@@ -167,7 +167,7 @@ async def create_sparse_embedding(
|
|
| 167 |
for idx, sparse_result in enumerate(sparse_results):
|
| 168 |
sparse_embeddings.append(
|
| 169 |
SparseEmbedding(
|
| 170 |
-
text=request.
|
| 171 |
indices=sparse_result["indices"],
|
| 172 |
values=sparse_result["values"],
|
| 173 |
)
|
|
@@ -176,14 +176,13 @@ async def create_sparse_embedding(
|
|
| 176 |
response = SparseEmbedResponse(
|
| 177 |
embeddings=sparse_embeddings,
|
| 178 |
count=len(sparse_embeddings),
|
| 179 |
-
|
| 180 |
-
processing_time=processing_time,
|
| 181 |
)
|
| 182 |
|
| 183 |
else:
|
| 184 |
raise HTTPException(
|
| 185 |
status_code=status.HTTP_400_BAD_REQUEST,
|
| 186 |
-
detail=f"Model '{request.
|
| 187 |
)
|
| 188 |
|
| 189 |
logger.info(
|
|
|
|
| 105 |
)
|
| 106 |
|
| 107 |
logger.info(
|
| 108 |
+
f"Generated {len(request.input)} embeddings "
|
| 109 |
+
f"in {processing_time:.3f}s ({len(request.input) / processing_time:.1f} texts/s)"
|
| 110 |
)
|
| 111 |
|
| 112 |
return response
|
|
|
|
| 149 |
HTTPException: On validation or generation errors
|
| 150 |
"""
|
| 151 |
try:
|
| 152 |
+
validate_texts(request.input)
|
| 153 |
kwargs = extract_embedding_kwargs(request)
|
| 154 |
|
| 155 |
+
model = manager.get_model(request.model)
|
| 156 |
+
config = manager.model_configs[request.model]
|
| 157 |
|
| 158 |
start_time = time.time()
|
| 159 |
|
|
|
|
| 167 |
for idx, sparse_result in enumerate(sparse_results):
|
| 168 |
sparse_embeddings.append(
|
| 169 |
SparseEmbedding(
|
| 170 |
+
text=request.input[idx],
|
| 171 |
indices=sparse_result["indices"],
|
| 172 |
values=sparse_result["values"],
|
| 173 |
)
|
|
|
|
| 176 |
response = SparseEmbedResponse(
|
| 177 |
embeddings=sparse_embeddings,
|
| 178 |
count=len(sparse_embeddings),
|
| 179 |
+
model=request.model
|
|
|
|
| 180 |
)
|
| 181 |
|
| 182 |
else:
|
| 183 |
raise HTTPException(
|
| 184 |
status_code=status.HTTP_400_BAD_REQUEST,
|
| 185 |
+
detail=f"Model '{request.model}' is not a sparse model. Type: {config.type}",
|
| 186 |
)
|
| 187 |
|
| 188 |
logger.info(
|
src/models/schemas/requests.py
CHANGED
|
@@ -130,7 +130,7 @@ class RerankRequest(BaseEmbedRequest):
|
|
| 130 |
class Config:
|
| 131 |
json_schema_extra = {
|
| 132 |
"example": {
|
| 133 |
-
"
|
| 134 |
"query": "Python best programming languages for data science",
|
| 135 |
"top_k": 4,
|
| 136 |
"documents": [
|
|
|
|
| 130 |
class Config:
|
| 131 |
json_schema_extra = {
|
| 132 |
"example": {
|
| 133 |
+
"model": "jina-reranker-v3",
|
| 134 |
"query": "Python best programming languages for data science",
|
| 135 |
"top_k": 4,
|
| 136 |
"documents": [
|