Spaces:

stefanches
/

OpenBIDSifier

Sleeping

App Files Files Community

zuazo committed on Nov 23, 2025

Commit

0f31aa7

1 Parent(s): 135f5f7

Add multi-provider LLM support (OpenAI, Anthropic, Gemini, Databricks, Ollama)

Browse files

Files changed (2) hide show

agent.py +19 -10
gradio-ui.py +117 -27

agent.py CHANGED Viewed

@@ -9,25 +9,34 @@ import prompts
 class BIDSifierAgent:
 	"""Wrapper around OpenAI chat API for step-wise BIDSification."""
-	def __init__(self, *, provider: str, model: str, openai_api_key: Optional[str] = None, temperature: float = 0.2):
 		load_dotenv()
-		if provider=="openai":
-			if model.startswith("gpt-5"): #reasoning model that requires special handling
-				temperature = 1.0
-				lm = dspy.LM(f"{provider}/{model}", api_key=openai_api_key or os.getenv("OPENAI_API_KEY"), temperature = temperature, max_tokens = 40000)
-			else:
-				lm = dspy.LM(f"{provider}/{model}", api_key=openai_api_key or os.getenv("OPENAI_API_KEY"), temperature = temperature, max_tokens = 10000)
 		else:
-			lm = dspy.LM(f"{provider}/{model}", api_key="", max_tokens=10000)
 		dspy.configure(lm=lm)
 		self.llm = lm
 		self.model = model or os.getenv("BIDSIFIER_MODEL", "gpt-4o-mini")
 		self.temperature = temperature
 	def _build_user_prompt(self, step: str, context: Dict[str, Any]) -> str:
 		dataset_xml = context.get("dataset_xml")
 		readme_text = context.get("readme_text")

 class BIDSifierAgent:
 	"""Wrapper around OpenAI chat API for step-wise BIDSification."""
+	def __init__(
+		self, *,
+		provider: str,
+		model: str,
+		api_key: Optional[str] = None,
+		api_base: Optional[str] = None,
+		temperature: Optional[float] = 0.2,
+	):
+		"""Build the DSPy language model and register it as the default LM.
+		Parameters
+		----------
+		provider : str
+			Provider prefix used to build the ``provider/model`` identifier.
+		model : str
+			Model name; names starting with ``gpt-5`` get special settings.
+		api_key : str, optional
+			Provider API key. When empty, the ``<PROVIDER>_API_KEY``
+			environment variable is used instead.
+		api_base : str, optional
+			Base URL of the LLM endpoint. Forwarded to the LM only when set.
+		temperature : float, optional
+			Currently overridden for every model (see the note below).
+		"""
 		load_dotenv()
+		# NOTE(review): the caller-supplied temperature is never used; it is
+		# replaced by 1.0 for gpt-5 models and by None otherwise. Confirm this
+		# is intended before relying on the parameter.
+		if model.startswith("gpt-5"):  # reasoning model that requires special handling
+			temperature = 1.0
+			max_tokens = 40000
 		else:
+			temperature = None
+			max_tokens = 10000
+		# Forward the endpoint only when one was given, so that an empty value
+		# (None or "") does not override the provider's default base URL.
+		lm_kwargs = {}
+		if api_base:
+			lm_kwargs["api_base"] = api_base
+		lm = dspy.LM(
+			f"{provider}/{model}",
+			api_key=api_key or os.getenv(f"{provider.upper()}_API_KEY"),
+			temperature=temperature, max_tokens=max_tokens,
+			**lm_kwargs,
+		)
 		dspy.configure(lm=lm)
 		self.llm = lm
 		self.model = model or os.getenv("BIDSIFIER_MODEL", "gpt-4o-mini")
 		self.temperature = temperature
 	def _build_user_prompt(self, step: str, context: Dict[str, Any]) -> str:
 		dataset_xml = context.get("dataset_xml")
 		readme_text = context.get("readme_text")

gradio-ui.py CHANGED Viewed

@@ -36,6 +36,47 @@ STEP_LABELS = list(BIDSIFIER_STEPS.keys())
 NUM_STEPS = len(STEP_LABELS)
 # Helpers
 def split_shell_commands(text: str) -> List[str]:
@@ -121,8 +162,33 @@ def build_context(
 # Core callbacks
 def call_bidsifier_step(
-    openai_api_key: str,
     dataset_xml: str,
     readme_text: str,
     publication_text: str,
@@ -137,6 +203,10 @@ def call_bidsifier_step(
     Parameters
     ----------
     dataset_xml : str
         Dataset XML content.
     readme_text : str
@@ -185,7 +255,9 @@ def call_bidsifier_step(
     step_id = BIDSIFIER_STEPS[step_label]
     context = build_context(dataset_xml, readme_text, publication_text, output_root)
-    agent = BIDSifierAgent(provider=provider, model=model, openai_api_key=openai_api_key)
     # Decide whether to use the structured step prompt or a free-form query:
     if manual_prompt.strip():
@@ -204,7 +276,7 @@ def call_bidsifier_step(
         step_index = 0
     state = {
-        "openai_api_key": openai_api_key,
         "dataset_xml": dataset_xml,
         "readme_text": readme_text,
         "publication_text": publication_text,
@@ -217,7 +289,9 @@ def call_bidsifier_step(
         "commands": commands,
     }
-    return llm_output, commands_str, state, step_index
 def confirm_commands(
@@ -288,7 +362,7 @@ def confirm_commands(
     agent = BIDSifierAgent(
         provider=last_state.get("provider", "openai"),
-        model=last_state.get("model", "gpt-4o-mini"),
     )
     llm_output = agent.run_step(next_id, context)
@@ -479,13 +553,6 @@ with gr.Blocks(
         """
     )
-    with gr.Row():
-        openai_key_input = gr.Textbox(
-            label="OpenAI API Key",
-            placeholder="Paste your OpenAI API key here",
-            lines=1,
-            type="password",
-        )
     with gr.Row():
         dataset_xml_file = gr.File(
             label="Upload dataset_structure.xml (optional)",
@@ -509,17 +576,35 @@ with gr.Blocks(
         lines=6,
     )
-    with gr.Accordion("LLM settings (advanced)", open=False):
-        provider_input = gr.Dropdown(
-            label="Provider",
-            choices=["openai"],
-            value="openai",
-        )
-        model_input = gr.Textbox(
-            label="Model",
-            value="gpt-4o-mini",
-            placeholder="e.g., gpt-4o-mini, gpt-5",
         )
     output_root_input = gr.Textbox(
         label="Output root",
@@ -554,10 +639,8 @@ with gr.Blocks(
     call_button = gr.Button("Call BIDSifier", variant="primary")
-    llm_output_box = gr.Textbox(
-        label="Raw BIDSifier output",
-        lines=10,
-        interactive=True,
     )
     commands_box = gr.Textbox(
@@ -578,10 +661,17 @@ with gr.Blocks(
     # Wiring
     call_button.click(
         fn=call_bidsifier_step,
         inputs=[
-            openai_key_input,
             dataset_xml_input,
             readme_input,
             publication_input,

 NUM_STEPS = len(STEP_LABELS)
+# Per-provider UI defaults, keyed by provider name. Each entry holds:
+#   "model"    - default model name shown in the Model textbox,
+#   "doc"      - Markdown help text shown for the provider,
+#   "key_base" - (optional) default API base URL for the API Base textbox.
+PROVIDERS_INFO = {
+    "openai": {
+        "model": "gpt-4o-mini",
+        "doc": "You can authenticate by setting the **API Key** above.",
+    },
+    "anthropic": {
+        "model": "claude-sonnet-4-5-20250929",
+        "doc": "You can authenticate by setting the **API Key** above.",
+    },
+    "databricks": {
+        "model": "databricks-llama-4-maverick",
+        "doc": (
+            "If you're on the Databricks platform, authentication is automatic"
+            " via their SDK. If not, you can set the **API Key** above."
+        ),
+    },
+    "gemini": {
+        "model": "gemini-2.5-flash",
+        "doc": "You can authenticate by setting the **API Key** above.",
+    },
+    "ollama_chat": {
+        "model": "llama3.2:1b",
+        "doc": """
+First, install Ollama and launch its server with your LM:
+```
+> curl -fsSL https://ollama.ai/install.sh | sh
+> ollama run llama3.2:1b
+```
+You can search all the Ollama models here: https://ollama.com/search
+You can also manually input another provider. See the
+[DSPy documentation](https://dspy.ai/api/models/LM/) for other providers and
+local LLMs.
+        """,
+        "key_base": "http://localhost:11434",
+    },
+}
 # Helpers
 def split_shell_commands(text: str) -> List[str]:
 # Core callbacks
+def select_provider(provider: str):
+    """Return the default model, API base, and documentation of a provider.
+    Parameters
+    ----------
+    provider : str
+        The name of the provider. Matching is case-insensitive.
+    Returns
+    -------
+    tuple
+        Three strings: default model name, default API base URL, and
+        provider documentation in MD. Each one is empty when the provider
+        is unknown or its entry does not define that field.
+    """
+    # A missing selection (None) is handled like an unknown provider instead
+    # of raising AttributeError on ``.lower()``.
+    provider_info = PROVIDERS_INFO.get((provider or "").lower(), {})
+    return (
+        provider_info.get("model", ""),
+        provider_info.get("key_base", ""),
+        provider_info.get("doc", ""),
+    )
 def call_bidsifier_step(
+    api_key: str,
+    api_base: str,
     dataset_xml: str,
     readme_text: str,
     publication_text: str,
     Parameters
     ----------
+    api_key : str
+        LLM provider API key.
+    api_base : str
+        Local LLM base URL.
     dataset_xml : str
         Dataset XML content.
     readme_text : str
     step_id = BIDSIFIER_STEPS[step_label]
     context = build_context(dataset_xml, readme_text, publication_text, output_root)
+    agent = BIDSifierAgent(
+        provider=provider, model=model, api_key=api_key, api_base=api_base
+    )
     # Decide whether to use the structured step prompt or a free-form query:
     if manual_prompt.strip():
         step_index = 0
     state = {
+        "api_key": api_key,
         "dataset_xml": dataset_xml,
         "readme_text": readme_text,
         "publication_text": publication_text,
         "commands": commands,
     }
+    llm_output_text = "## Raw BIDSifier output\n" + llm_output
+    return llm_output_text, commands_str, state, step_index
 def confirm_commands(
     agent = BIDSifierAgent(
         provider=last_state.get("provider", "openai"),
+        model=last_state.get("model", PROVIDERS_INFO["openai"]["model"]),
     )
     llm_output = agent.run_step(next_id, context)
         """
     )
     with gr.Row():
         dataset_xml_file = gr.File(
             label="Upload dataset_structure.xml (optional)",
         lines=6,
     )
+    with gr.Accordion("LLM settings"):
+        api_key_input = gr.Textbox(
+            label="API Key (OpenAI, Gemini, Anthropic, Databricks)",
+            placeholder=(
+                "Paste your LLM provider API key here."
+                ' See "Advanced settings" to set up non-OpenAI providers.'
+            ),
+            lines=1,
+            type="password",
         )
+        with gr.Accordion("Advanced settings", open=False):
+            default_provider = list(PROVIDERS_INFO.keys())[0]
+            provider_input = gr.Dropdown(
+                label="Provider",
+                choices=PROVIDERS_INFO.keys(),
+                value=default_provider,
+                interactive=True,
+            )
+            model_input = gr.Textbox(
+                label="Model",
+                value=PROVIDERS_INFO[default_provider]["model"],
+                placeholder="e.g., gpt-4o-mini, gpt-5",
+            )
+            api_base_input = gr.Textbox(
+                label="API Base (Local LLMs, other providers)",
+                placeholder="Write your API Base URL here",
+                lines=1,
+            )
+            model_doc = gr.Markdown(PROVIDERS_INFO[default_provider]["doc"])
     output_root_input = gr.Textbox(
         label="Output root",
     call_button = gr.Button("Call BIDSifier", variant="primary")
+    llm_output_box = gr.Markdown(
+        label="Raw BIDSifier output", show_label=True, container=True
     )
     commands_box = gr.Textbox(
     # Wiring
+    provider_input.change(
+        fn=select_provider,
+        inputs=provider_input,
+        outputs=[model_input, api_base_input, model_doc],
+    )
     call_button.click(
         fn=call_bidsifier_step,
         inputs=[
+            api_key_input,
+            api_base_input,
             dataset_xml_input,
             readme_input,
             publication_input,