ROBO-R1984

Build error

App Files Files Community

openfree committed on Jun 16, 2025

Commit

3c39492

verified ·

1 Parent(s): bbe7924

Update app.py

Browse files

Files changed (1) hide show

app.py +40 -5

app.py CHANGED Viewed

@@ -25,6 +25,9 @@ from io import BytesIO
 from llama_cpp import Llama
 from llama_cpp.llama_chat_format import Llava16ChatHandler
 # CSV/TXT 분석
 import pandas as pd
 # PDF 텍스트 추출
@@ -210,6 +213,37 @@ def image_to_base64_data_uri(image: Union[np.ndarray, Image.Image]) -> str:
 ##############################################################################
 # 모델 로드
 ##############################################################################
 @spaces.GPU(duration=120)
 def load_model():
     global llm, model_loaded
@@ -222,9 +256,8 @@ def load_model():
         logger.info("Gemma3-R1984-4B GGUF Q4_K_M 모델 로딩 시작...")
         clear_cuda_cache()
-        # 모델 경로 설정
-        model_path = os.getenv("MODEL_PATH", "VIDraft/Gemma-3-R1984-4B-GGUF/Gemma-3-R1984-4B.Q4_K_M.gguf")
-        mmproj_path = os.getenv("MMPROJ_PATH", "VIDraft/Gemma-3-R1984-4B-GGUF/Gemma-3-R1984-4B.mmproj-Q8_0.gguf")
         # GPU 사용 가능 여부 확인
         n_gpu_layers = -1 if torch.cuda.is_available() else 0
@@ -253,6 +286,8 @@ def load_model():
     except Exception as e:
         logger.error(f"모델 로딩 실패: {e}")
         return False
 ##############################################################################
@@ -807,8 +842,8 @@ with gr.Blocks(title="🤖 로봇 시각 시스템 (Gemma3-4B GGUF)", css=css) a
     # 초기 모델 로드
     def initial_load():
-        load_model()
-        return "시스템 준비 완료! 🚀"
     demo.load(
         fn=initial_load,

 from llama_cpp import Llama
 from llama_cpp.llama_chat_format import Llava16ChatHandler
+# Model download
+from huggingface_hub import hf_hub_download
 # CSV/TXT 분석
 import pandas as pd
 # PDF 텍스트 추출
 ##############################################################################
 # 모델 로드
 ##############################################################################
+def download_model_files():
+    """Hugging Face Hub에서 모델 파일 다운로드"""
+    model_repo = "VIDraft/Gemma-3-R1984-4B-GGUF"
+    # 메인 모델 다운로드
+    model_filename = "Gemma-3-R1984-4B.Q4_K_M.gguf"
+    logger.info(f"모델 다운로드 중: {model_filename}")
+    model_path = hf_hub_download(
+        repo_id=model_repo,
+        filename=model_filename,
+        resume_download=True,
+        local_files_only=False
+    )
+    # Vision projection 파일 다운로드
+    mmproj_filename = "Gemma-3-R1984-4B.mmproj-Q8_0.gguf"
+    logger.info(f"Vision 모델 다운로드 중: {mmproj_filename}")
+    mmproj_path = hf_hub_download(
+        repo_id=model_repo,
+        filename=mmproj_filename,
+        resume_download=True,
+        local_files_only=False
+    )
+    logger.info(f"모델 경로: {model_path}")
+    logger.info(f"Vision 경로: {mmproj_path}")
+    return model_path, mmproj_path
 @spaces.GPU(duration=120)
 def load_model():
     global llm, model_loaded
         logger.info("Gemma3-R1984-4B GGUF Q4_K_M 모델 로딩 시작...")
         clear_cuda_cache()
+        # 모델 파일 다운로드
+        model_path, mmproj_path = download_model_files()
         # GPU 사용 가능 여부 확인
         n_gpu_layers = -1 if torch.cuda.is_available() else 0
     except Exception as e:
         logger.error(f"모델 로딩 실패: {e}")
+        import traceback
+        logger.error(traceback.format_exc())
         return False
 ##############################################################################
     # 초기 모델 로드
     def initial_load():
+        # 첫 실행 시 GPU에서 모델 로드
+        return "시스템 준비 완료! 첫 분석 시 모델이 자동으로 로드됩니다. 🚀"
     demo.load(
         fn=initial_load,