Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -423,76 +423,62 @@ print("Pipeline initialized!")
|
|
| 423 |
print("=" * 80)
|
| 424 |
|
| 425 |
# =============================================================================
|
| 426 |
-
# ZeroGPU Tensor Preloading -
|
| 427 |
# =============================================================================
|
|
|
|
|
|
|
|
|
|
|
|
|
| 428 |
|
| 429 |
-
print("Preloading
|
| 430 |
-
|
| 431 |
-
# =====
|
| 432 |
-
print("
|
| 433 |
-
|
| 434 |
-
|
| 435 |
-
|
| 436 |
-
|
| 437 |
-
|
| 438 |
-
|
| 439 |
-
|
| 440 |
-
|
| 441 |
-
|
| 442 |
-
|
| 443 |
-
|
| 444 |
-
|
| 445 |
-
|
| 446 |
-
|
| 447 |
-
|
| 448 |
-
|
| 449 |
-
|
| 450 |
-
|
| 451 |
-
|
| 452 |
-
|
| 453 |
-
|
| 454 |
-
|
| 455 |
-
|
| 456 |
-
|
| 457 |
-
|
| 458 |
-
|
| 459 |
-
|
| 460 |
-
|
| 461 |
-
|
| 462 |
-
print("
|
| 463 |
-
|
| 464 |
-
# =====
|
| 465 |
-
print("
|
| 466 |
-
|
| 467 |
-
|
| 468 |
-
|
| 469 |
-
|
| 470 |
-
|
| 471 |
-
|
| 472 |
-
|
| 473 |
-
|
| 474 |
-
|
| 475 |
-
|
| 476 |
-
|
| 477 |
-
|
| 478 |
-
_video_encoder2 = _orig_video_encoder_factory2()
|
| 479 |
-
_video_decoder2 = _orig_video_decoder_factory2()
|
| 480 |
-
_audio_decoder2 = _orig_audio_decoder_factory2()
|
| 481 |
-
_vocoder2 = _orig_vocoder_factory2()
|
| 482 |
-
_spatial_upsampler2 = _orig_spatial_upsampler_factory2()
|
| 483 |
-
_text_encoder2 = _orig_text_encoder_factory2()
|
| 484 |
-
_embeddings_processor2 = _orig_gemma_embeddings_factory2()
|
| 485 |
-
|
| 486 |
-
ledger2.transformer = lambda: _transformer2
|
| 487 |
-
ledger2.video_encoder = lambda: _video_encoder2
|
| 488 |
-
ledger2.video_decoder = lambda: _video_decoder2
|
| 489 |
-
ledger2.audio_decoder = lambda: _audio_decoder2
|
| 490 |
-
ledger2.vocoder = lambda: _vocoder2
|
| 491 |
-
ledger2.spatial_upsampler = lambda: _spatial_upsampler2
|
| 492 |
-
ledger2.text_encoder = lambda: _text_encoder2
|
| 493 |
-
ledger2.gemma_embeddings_processor = lambda: _embeddings_processor2
|
| 494 |
-
|
| 495 |
-
print(" Stage 2 models preloaded")
|
| 496 |
|
| 497 |
print("All models preloaded for ZeroGPU tensor packing!")
|
| 498 |
print("=" * 80)
|
|
|
|
| 423 |
print("=" * 80)
|
| 424 |
|
| 425 |
# =============================================================================
|
| 426 |
+
# ZeroGPU Tensor Preloading - Shared Components Once, Transformers Per Stage
|
| 427 |
# =============================================================================
|
| 428 |
+
# Many components are SHARED between stage 1 and stage 2:
|
| 429 |
+
# - video_encoder, text_encoder (Gemma), audio_decoder, vocoder, embeddings_processor, spatial_upsampler
|
| 430 |
+
# These only need to be loaded ONCE.
|
| 431 |
+
# Only the TRANSFORMER is different per stage (different LoRA weights).
|
| 432 |
|
| 433 |
+
print("Preloading models for ZeroGPU tensor packing...")
|
| 434 |
+
|
| 435 |
+
# ===== Preload SHARED components (load once, share) =====
|
| 436 |
+
print(" Loading shared components...")
|
| 437 |
+
shared_ledger = pipeline.stage_1_model_ledger
|
| 438 |
+
|
| 439 |
+
# These are shared - load once from stage 1
|
| 440 |
+
_video_encoder = shared_ledger.video_encoder()
|
| 441 |
+
shared_ledger.video_encoder = lambda: _video_encoder
|
| 442 |
+
|
| 443 |
+
_text_encoder = shared_ledger.text_encoder()
|
| 444 |
+
shared_ledger.text_encoder = lambda: _text_encoder
|
| 445 |
+
|
| 446 |
+
_embeddings_processor = shared_ledger.gemma_embeddings_processor()
|
| 447 |
+
shared_ledger.gemma_embeddings_processor = lambda: _embeddings_processor
|
| 448 |
+
|
| 449 |
+
_audio_decoder = shared_ledger.audio_decoder()
|
| 450 |
+
shared_ledger.audio_decoder = lambda: _audio_decoder
|
| 451 |
+
|
| 452 |
+
_vocoder = shared_ledger.vocoder()
|
| 453 |
+
shared_ledger.vocoder = lambda: _vocoder
|
| 454 |
+
|
| 455 |
+
_spatial_upsampler = shared_ledger.spatial_upsampler()
|
| 456 |
+
shared_ledger.spatial_upsampler = lambda: _spatial_upsampler
|
| 457 |
+
|
| 458 |
+
# Point stage 2 to same shared components
|
| 459 |
+
pipeline.stage_2_model_ledger.video_encoder = lambda: _video_encoder
|
| 460 |
+
pipeline.stage_2_model_ledger.text_encoder = lambda: _text_encoder
|
| 461 |
+
pipeline.stage_2_model_ledger.gemma_embeddings_processor = lambda: _embeddings_processor
|
| 462 |
+
pipeline.stage_2_model_ledger.audio_decoder = lambda: _audio_decoder
|
| 463 |
+
pipeline.stage_2_model_ledger.vocoder = lambda: _vocoder
|
| 464 |
+
pipeline.stage_2_model_ledger.spatial_upsampler = lambda: _spatial_upsampler
|
| 465 |
+
|
| 466 |
+
print(" Shared components preloaded")
|
| 467 |
+
|
| 468 |
+
# ===== Preload UNIQUE transformers per stage =====
|
| 469 |
+
print(" Loading stage 1 transformer...")
|
| 470 |
+
_transformer1 = pipeline.stage_1_model_ledger.transformer()
|
| 471 |
+
pipeline.stage_1_model_ledger.transformer = lambda: _transformer1
|
| 472 |
+
|
| 473 |
+
print(" Loading stage 2 transformer...")
|
| 474 |
+
_transformer2 = pipeline.stage_2_model_ledger.transformer()
|
| 475 |
+
pipeline.stage_2_model_ledger.transformer = lambda: _transformer2
|
| 476 |
+
|
| 477 |
+
# ===== Preload video_decoder (loaded once from stage 1 and reused by stage 2) =====
|
| 478 |
+
print(" Loading video decoder...")
|
| 479 |
+
_video_decoder1 = shared_ledger.video_decoder()
|
| 480 |
+
shared_ledger.video_decoder = lambda: _video_decoder1
|
| 481 |
+
pipeline.stage_2_model_ledger.video_decoder = lambda: _video_decoder1
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 482 |
|
| 483 |
print("All models preloaded for ZeroGPU tensor packing!")
|
| 484 |
print("=" * 80)
|