alconost
/

translategemma-12b-custom

mrmiku committed on Jan 24

Commit

9d0793e

verified ·

1 Parent(s): b34c972

Upload handler.py with huggingface_hub

Files changed (1) hide show

handler.py CHANGED Viewed

@@ -52,13 +52,14 @@ class EndpointHandler:
         if is_custom_prompt:
             # Custom prompt format for unsupported languages
-            # Use Gemma chat format: <start_of_turn>user\n{instruction} {text}<end_of_turn>\n<start_of_turn>model\n
-            prompt = f"<start_of_turn>user\n{target_lang} {text}<end_of_turn>\n<start_of_turn>model\n"
-            inputs = self.processor.tokenizer(
                 prompt,
                 return_tensors="pt",
                 add_special_tokens=True
-            ).to(self.model.device)
         else:
             # Standard language code: use structured message format
             messages = [

         if is_custom_prompt:
             # Custom prompt format for unsupported languages
+            # Add explicit instruction to return ONLY the translation
+            prompt = f"<start_of_turn>user\n{target_lang} Output only the translation, no explanations.\n\n{text}<end_of_turn>\n<start_of_turn>model\n"
+            tokenized = self.processor.tokenizer(
                 prompt,
                 return_tensors="pt",
                 add_special_tokens=True
+            )
+            inputs = {k: v.to(self.model.device) for k, v in tokenized.items()}
         else:
             # Standard language code: use structured message format
             messages = [