Update src/backends.py
Browse files- src/backends.py +27 -5
src/backends.py
CHANGED
|
@@ -1,6 +1,7 @@
|
|
| 1 |
import os
|
| 2 |
from dataclasses import dataclass
|
| 3 |
-
from typing import Optional, Dict, Any,
|
|
|
|
| 4 |
from huggingface_hub import InferenceClient
|
| 5 |
|
| 6 |
try:
|
|
@@ -9,8 +10,17 @@ except Exception:
|
|
| 9 |
Image = None
|
| 10 |
|
| 11 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 12 |
@dataclass
|
| 13 |
class HFInferenceAPIBackend:
|
|
|
|
|
|
|
|
|
|
|
|
|
| 14 |
model_id: str
|
| 15 |
token: Optional[str] = None
|
| 16 |
timeout_s: int = 180
|
|
@@ -23,8 +33,9 @@ class HFInferenceAPIBackend:
|
|
| 23 |
temperature = float(params.get("temperature", 0.2))
|
| 24 |
max_new_tokens = int(params.get("max_new_tokens", 600))
|
| 25 |
top_p = float(params.get("top_p", 0.95))
|
|
|
|
| 26 |
|
| 27 |
-
#
|
| 28 |
try:
|
| 29 |
messages = []
|
| 30 |
if system:
|
|
@@ -40,19 +51,30 @@ class HFInferenceAPIBackend:
|
|
| 40 |
)
|
| 41 |
return resp.choices[0].message.content
|
| 42 |
except Exception:
|
|
|
|
| 43 |
out = self.client.text_generation(
|
| 44 |
prompt=(f"{system}\n\n{prompt}" if system else prompt),
|
| 45 |
temperature=temperature,
|
| 46 |
max_new_tokens=max_new_tokens,
|
| 47 |
top_p=top_p,
|
|
|
|
| 48 |
do_sample=True,
|
| 49 |
return_full_text=False,
|
| 50 |
)
|
| 51 |
return out
|
| 52 |
|
| 53 |
-
# --- NEW: image -> text (OCR / caption) ---
|
| 54 |
def image_to_text(self, image: "Image.Image") -> str:
|
| 55 |
"""
|
| 56 |
-
|
| 57 |
"""
|
| 58 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
import io
import os
from dataclasses import dataclass
from typing import Any, Dict, Optional, Protocol

from huggingface_hub import InferenceClient
|
| 6 |
|
| 7 |
try:
|
|
|
|
| 10 |
Image = None
|
| 11 |
|
| 12 |
|
| 13 |
+
class LLMBackend(Protocol):
    """
    Structural (duck-typed) interface for text-generation backends.

    Any object with a matching ``generate`` method satisfies this protocol;
    no inheritance is required.
    """

    def generate(self, prompt: str, *, system: Optional[str], params: Dict[str, Any]) -> str:
        """
        Return generated text for *prompt*.

        system: optional system/instruction prefix (may be None).
        params: backend-specific sampling options — NOTE(review): observed keys
        elsewhere in this file are temperature / max_new_tokens / top_p /
        repetition_penalty; confirm against each implementation.
        """
        ...
|
| 16 |
+
|
| 17 |
+
|
| 18 |
@dataclass
|
| 19 |
class HFInferenceAPIBackend:
|
| 20 |
+
"""
|
| 21 |
+
Uses HF Inference API via huggingface_hub.InferenceClient.
|
| 22 |
+
Works well on Spaces if you provide HF_TOKEN in Secrets.
|
| 23 |
+
"""
|
| 24 |
model_id: str
|
| 25 |
token: Optional[str] = None
|
| 26 |
timeout_s: int = 180
|
|
|
|
| 33 |
temperature = float(params.get("temperature", 0.2))
|
| 34 |
max_new_tokens = int(params.get("max_new_tokens", 600))
|
| 35 |
top_p = float(params.get("top_p", 0.95))
|
| 36 |
+
repetition_penalty = float(params.get("repetition_penalty", 1.05))
|
| 37 |
|
| 38 |
+
# Prefer chat when supported
|
| 39 |
try:
|
| 40 |
messages = []
|
| 41 |
if system:
|
|
|
|
| 51 |
)
|
| 52 |
return resp.choices[0].message.content
|
| 53 |
except Exception:
|
| 54 |
+
# Fallback: text generation
|
| 55 |
out = self.client.text_generation(
|
| 56 |
prompt=(f"{system}\n\n{prompt}" if system else prompt),
|
| 57 |
temperature=temperature,
|
| 58 |
max_new_tokens=max_new_tokens,
|
| 59 |
top_p=top_p,
|
| 60 |
+
repetition_penalty=repetition_penalty,
|
| 61 |
do_sample=True,
|
| 62 |
return_full_text=False,
|
| 63 |
)
|
| 64 |
return out
|
| 65 |
|
|
|
|
| 66 |
def image_to_text(self, image: "Image.Image") -> str:
|
| 67 |
"""
|
| 68 |
+
HF task 'image-to-text' (captioning / OCR-like depending on model).
|
| 69 |
"""
|
| 70 |
+
if Image is None:
|
| 71 |
+
raise RuntimeError("Pillow not installed")
|
| 72 |
+
res = self.client.image_to_text(image)
|
| 73 |
+
# huggingface_hub returns an object with generated_text
|
| 74 |
+
return getattr(res, "generated_text", str(res))
|
| 75 |
+
|
| 76 |
+
|
| 77 |
+
def make_backend(backend_type: str, model_id: str) -> LLMBackend:
    """
    Factory: build the backend instance named by *backend_type*.

    Parameters:
        backend_type: backend identifier; only "hf_inference_api" is supported.
        model_id: model repository id handed to the backend.

    Returns:
        A configured object satisfying the LLMBackend protocol.

    Raises:
        ValueError: if *backend_type* names no known backend.
    """
    if backend_type != "hf_inference_api":
        raise ValueError(f"Unknown backend: {backend_type}")
    return HFInferenceAPIBackend(model_id=model_id)
|