Spaces:

factorstudios
/

NMFL

Runtime error

Factor Studios committed on Aug 15, 2025

Commit

7a9b3ec

verified ·

1 Parent(s): 319082b

Update test_ai_integration_http.py

Files changed (1) hide show

test_ai_integration_http.py CHANGED Viewed

@@ -95,20 +95,19 @@ def test_ai_integration_http():
                 transformers_logger.setLevel(logging.ERROR)
                 try:
-                    # Create pipeline
-                    # Create pipeline with vGPU device
                     pipe = pipeline(
                         "text-generation",
                         model=model_id,
-                        torch_dtype=torch.float32,  # Use full precision,
                         use_safetensors=True,
                         trust_remote_code=True,
-                        device=device
                     )
-                    pipe.model.eval()
-                    # Move pipeline model to vGPU
                     status['model_on_vgpu'] = True
                     # Log model details

                 transformers_logger.setLevel(logging.ERROR)
                 try:
+                    # Create pipeline with model directly on vGPU
                     pipe = pipeline(
                         "text-generation",
                         model=model_id,
+                        model_kwargs={
+                            "torch_dtype": torch.float32,  # Use full precision
+                            "device_map": {"": device},  # Map all modules to our vGPU device
+                        },
                         use_safetensors=True,
                         trust_remote_code=True,
+                        device=device  # Use our vGPU device
                     )
+                    status["pipeline_loaded"] = True
                     status['model_on_vgpu'] = True
                     # Log model details