Factor Studios committed: Upload 2 files

Files changed:
- ai.py (+8 -2)
- test_ai_integration.py (+40 -21)
ai.py CHANGED

@@ -138,9 +138,13 @@ class AIAccelerator:
             raise RuntimeError("VRAM not properly configured")

         # Test tensor core functionality with a small computation
-        test_input = …
+        test_input = [[1.0, 2.0], [3.0, 4.0]]
+        # Convert input to numpy array if needed
+        if isinstance(test_input, list):
+            test_input = np.array(test_input, dtype=np.float32)
+
         test_result = self.tensor_core_array.matmul(test_input, test_input)
-        if test_result is None or test_result.…
+        if test_result is None or not isinstance(test_result, (np.ndarray, list)) or len(test_result) == 0:
             raise RuntimeError("Tensor core test computation failed")

         self.tensor_cores_initialized = True

@@ -698,3 +702,5 @@ class AIAccelerator:
         except Exception as e:
             print(f"[ERROR] WebSocket-based inference failed for idx={idx}: {e}")
             return None
+
+
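For context, here is a minimal standalone sketch of the self-test pattern the ai.py change introduces: normalize the probe input to a float32 NumPy array, run a small matrix multiply, and validate the result before marking the tensor cores as initialized. The run_self_test helper and the use of np.matmul as a stand-in for TensorCoreArray.matmul are illustrative assumptions, not part of this repository.

# Standalone sketch of the self-test pattern; np.matmul stands in for the
# repository's TensorCoreArray.matmul, and run_self_test is a hypothetical helper.
import numpy as np

def run_self_test(matmul=np.matmul) -> bool:
    test_input = [[1.0, 2.0], [3.0, 4.0]]
    # Convert the input to a numpy array if needed, mirroring the diff
    if isinstance(test_input, list):
        test_input = np.array(test_input, dtype=np.float32)

    test_result = matmul(test_input, test_input)
    # Accept ndarray or list results, reject None or empty, as in the new check
    if test_result is None or not isinstance(test_result, (np.ndarray, list)) or len(test_result) == 0:
        raise RuntimeError("Tensor core test computation failed")
    return True

if __name__ == "__main__":
    print(run_self_test())  # expected: True; the product is [[7, 10], [15, 22]]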
test_ai_integration.py CHANGED

@@ -207,40 +207,59 @@ def test_ai_integration():
     ai_accelerators = []

     try:
-        # …
-
-        # …
-
-
-
-
-
-
-
+        # Reuse the existing storage connection from the previous test
+        if not components['storage'] or not components['storage'].wait_for_connection():
+            # If connection lost, try to reconnect
+            with websocket_manager() as shared_storage:
+                if not shared_storage or not shared_storage.wait_for_connection():
+                    raise RuntimeError("Could not establish WebSocket connection")
+                components['storage'] = shared_storage
+
+        shared_storage = components['storage']
+
+        # Initialize high-performance chip array with WebSocket storage
+        total_sms = 0
+        total_cores = 0
+
+        # Create optical interconnect for chip communication
+        from gpu_arch import OpticalInterconnect
+        optical_link = OpticalInterconnect(bandwidth_tbps=800, latency_ns=1)
+
+        # Reuse existing VRAM instance with shared storage
+        shared_vram = components['vram']
+        if shared_vram is None:
             shared_vram = VirtualVRAM()
-
+        shared_vram.storage = shared_storage

         for i in range(num_chips):
-            # Configure each chip with …
-            chip = Chip(chip_id=i, vram_size_gb=None…
+            # Configure each chip with shared WebSocket storage
+            chip = Chip(chip_id=i, vram_size_gb=None, storage=shared_storage)
             chips.append(chip)

             # Connect chips in a ring topology
             if i > 0:
                 chip.connect_chip(chips[i-1], optical_link)

-            # Initialize AI accelerator with shared …
+            # Initialize AI accelerator with shared resources
             ai_accelerator = chip.ai_accelerator
-            ai_accelerator.vram = shared_vram
+            ai_accelerator.vram = shared_vram
+            ai_accelerator.storage = shared_storage  # Ensure storage is set
             ai_accelerators.append(ai_accelerator)

+            # Verify WebSocket connection before loading model
+            if not shared_storage.wait_for_connection():
+                raise RuntimeError(f"Lost WebSocket connection during chip {i} initialization")
+
             # Load model weights from WebSocket storage (no CPU transfer)
-
-
-
-
-
+            try:
+                ai_accelerator.load_model(model_id, None, None)  # Model already in WebSocket storage
+            except Exception as e:
+                print(f"Warning: Failed to load model on chip {i}: {e}")
+                continue
+
+            # Track total processing units
+            total_sms += chip.num_sms
+            total_cores += chip.num_sms * chip.cores_per_sm

             # Store chip configuration in WebSocket storage
             storage.store_state(f"chips/{i}/config", "state", {
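For context, a minimal runnable sketch of the reuse-or-reconnect pattern the test now applies to the shared WebSocket storage: reuse the connection held in components when it still responds, otherwise reconnect through websocket_manager and update the shared reference. The FakeStorage class, the in-memory websocket_manager, and the local components dict are illustrative stand-ins for the test suite's real objects.

# Sketch of the reuse-or-reconnect pattern; FakeStorage and the in-memory
# websocket_manager below are illustrative stand-ins, not the repo's real API.
from contextlib import contextmanager

class FakeStorage:
    def __init__(self, connected: bool):
        self.connected = connected

    def wait_for_connection(self) -> bool:
        # The real storage object presumably blocks until the socket is ready
        return self.connected

@contextmanager
def websocket_manager():
    # Stand-in for the test suite's websocket_manager context manager
    yield FakeStorage(connected=True)

components = {"storage": FakeStorage(connected=False)}

# Reuse the existing connection if it is still alive; otherwise reconnect once
if not components["storage"] or not components["storage"].wait_for_connection():
    with websocket_manager() as shared_storage:
        if not shared_storage or not shared_storage.wait_for_connection():
            raise RuntimeError("Could not establish WebSocket connection")
        components["storage"] = shared_storage

shared_storage = components["storage"]
print(shared_storage.wait_for_connection())  # expected: True after reconnecting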