Spaces:

factorstudios
/

NMFL

Runtime error

App Files Files Community

Factor Studios committed on Aug 14, 2025

Commit

54aca07

verified ·

1 Parent(s): 7670c1d

Update test_ai_integration_http.py

Browse files

Files changed (1) hide show

test_ai_integration_http.py +18 -12

test_ai_integration_http.py CHANGED Viewed

@@ -17,6 +17,10 @@ from torch_vgpu import VGPUDevice, to_vgpu
 def setup_vgpu():
     """Setup vGPU device"""
     try:
         # Create and register vGPU device
         vgpu = VGPUDevice()
         device = vgpu.device()
@@ -96,16 +100,17 @@ def test_ai_integration_http():
                 transformers_logger.setLevel(logging.ERROR)
                 try:
-                    # Create pipeline
                     pipe = pipeline(
                         "text-generation",
                         model=model_id,
-                        torch_dtype="auto",
-                        device=device  # Use our vGPU device
                     )
                     status['pipeline_loaded'] = True
-                    # Move pipeline to vGPU
                     pipe.model = to_vgpu(pipe.model, vram=vram)
                     status['model_on_vgpu'] = True
@@ -131,19 +136,18 @@ def test_ai_integration_http():
             peak_mem = initial_mem
             try:
-                # Prepare messages
-                messages = [
-                    {"role": "user", "content": "Explain how virtual GPUs work in simple terms."}
-                ]
                 with torch.no_grad():
                     # Generate text
                     outputs = pipe(
-                        messages,
                         max_new_tokens=256,
                         temperature=0.7,
                         top_p=0.95,
-                        top_k=40
                     )
                     if hasattr(storage, 'get_used_memory'):
@@ -169,8 +173,10 @@ def test_ai_integration_http():
         finally:
             # Cleanup and status report
             try:
-                del model
-                del outputs
                 torch.cuda.empty_cache() if hasattr(torch, 'cuda') else None
                 status['cleanup_success'] = True
             except Exception as e:

 def setup_vgpu():
     """Setup vGPU device"""
     try:
+        # Register vGPU device type
+        if not hasattr(torch, 'vgpu'):
+            torch.register_privateuseone_backend()
         # Create and register vGPU device
         vgpu = VGPUDevice()
         device = vgpu.device()
                 transformers_logger.setLevel(logging.ERROR)
                 try:
+                    # Create pipeline and manually move to vGPU
                     pipe = pipeline(
                         "text-generation",
                         model=model_id,
+                        torch_dtype=torch.float32,
+                        device_map=None  # Don't auto-place on devices
                     )
                     status['pipeline_loaded'] = True
+                    # Move model to vGPU
+                    pipe.model = pipe.model.to(device)
                     pipe.model = to_vgpu(pipe.model, vram=vram)
                     status['model_on_vgpu'] = True
             peak_mem = initial_mem
             try:
+                # Prepare input text
+                text = "Explain how virtual GPUs work in simple terms."
                 with torch.no_grad():
                     # Generate text
                     outputs = pipe(
+                        text,
                         max_new_tokens=256,
                         temperature=0.7,
                         top_p=0.95,
+                        top_k=40,
+                        do_sample=True
                     )
                     if hasattr(storage, 'get_used_memory'):
         finally:
             # Cleanup and status report
             try:
+                if 'pipe' in locals():
+                    del pipe
+                if 'outputs' in locals():
+                    del outputs
                 torch.cuda.empty_cache() if hasattr(torch, 'cuda') else None
                 status['cleanup_success'] = True
             except Exception as e: