Felladrin committed on
Commit
548f210
·
1 Parent(s): 320c9ad

Allow users to decide if they want to base the 'task' argument from the
conversion script on the model's pipeline tag

Browse files

Because some models (e.g. "Norm/nougat-latex-base") can only be
converted with this option enabled.

Files changed (1) hide show
  1. app.py +22 -0
app.py CHANGED
@@ -309,6 +309,7 @@ class ModelConverter:
309
  input_model_id: str,
310
  trust_remote_code: bool = False,
311
  output_attentions: bool = False,
 
312
  ) -> Tuple[bool, Optional[str]]:
313
  """Convert a Hugging Face model to ONNX format.
314
 
@@ -316,6 +317,7 @@ class ModelConverter:
316
  input_model_id: Hugging Face model repository ID
317
  trust_remote_code: Whether to trust and execute remote code from the model
318
  output_attentions: Whether to output attention weights (required for some tasks)
 
319
 
320
  Returns:
321
  Tuple containing:
@@ -337,6 +339,18 @@ class ModelConverter:
337
  if output_attentions:
338
  conversion_args.append("--output_attentions")
339
 
 
 
 
 
 
 
 
 
 
 
 
 
340
  # Run the conversion
341
  result = self._run_conversion_subprocess(
342
  input_model_id, extra_args=conversion_args or None
@@ -521,6 +535,13 @@ def main():
521
  "Whether to output attentions from the Whisper model. This is required for word-level (token) timestamps."
522
  )
523
 
 
 
 
 
 
 
 
524
  # Determine output repository
525
  # If user owns the model, allow uploading to the same repo
526
  if config.hf_username == input_model_id.split("/")[0]:
@@ -559,6 +580,7 @@ def main():
559
  input_model_id,
560
  trust_remote_code=trust_remote_code,
561
  output_attentions=output_attentions,
 
562
  )
563
  if not success:
564
  st.error(f"Conversion failed: {stderr}")
 
309
  input_model_id: str,
310
  trust_remote_code: bool = False,
311
  output_attentions: bool = False,
312
+ enable_task_inference: bool = True,
313
  ) -> Tuple[bool, Optional[str]]:
314
  """Convert a Hugging Face model to ONNX format.
315
 
 
317
  input_model_id: Hugging Face model repository ID
318
  trust_remote_code: Whether to trust and execute remote code from the model
319
  output_attentions: Whether to output attention weights (required for some tasks)
320
+ enable_task_inference: Whether to pass the task argument to the conversion script based on the model's pipeline tag
321
 
322
  Returns:
323
  Tuple containing:
 
339
  if output_attentions:
340
  conversion_args.append("--output_attentions")
341
 
342
+ if enable_task_inference:
343
+ try:
344
+ info = model_info(
345
+ repo_id=input_model_id, token=self.config.hf_token
346
+ )
347
+ pipeline_tag = getattr(info, "pipeline_tag", None)
348
+ task = self._normalize_pipeline_tag(pipeline_tag)
349
+ if task:
350
+ conversion_args.extend(["--task", task])
351
+ except Exception:
352
+ pass
353
+
354
  # Run the conversion
355
  result = self._run_conversion_subprocess(
356
  input_model_id, extra_args=conversion_args or None
 
535
  "Whether to output attentions from the Whisper model. This is required for word-level (token) timestamps."
536
  )
537
 
538
+ # Optional: Task inference toggle
539
+ enable_task_inference = st.toggle(
540
+ "Optional: Base the 'task' argument from the conversion script on the model's pipeline tag",
541
+ value=False,
542
+ help="This can make the conversion of some models work, but may cause issues for others. It's recommended to first try converting the model with this option disabled, and only enable it if the conversion fails.",
543
+ )
544
+
545
  # Determine output repository
546
  # If user owns the model, allow uploading to the same repo
547
  if config.hf_username == input_model_id.split("/")[0]:
 
580
  input_model_id,
581
  trust_remote_code=trust_remote_code,
582
  output_attentions=output_attentions,
583
+ enable_task_inference=enable_task_inference,
584
  )
585
  if not success:
586
  st.error(f"Conversion failed: {stderr}")