Spaces:

noppodev
/

NoppoIntelligence

Sleeping

App Files Files Community

noppodev committed on Apr 12

Commit

755fbc6

verified ·

1 Parent(s): 6b2ead8

Update app.py

Browse files

Files changed (1) hide show

app.py +21 -16

app.py CHANGED Viewed

@@ -1,38 +1,49 @@
 import os
 import subprocess
 import gradio as gr
 from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
 import torch
 from huggingface_hub import HfApi
-# ---------------------------------------------------------
-# 1. モデル準備 (2026年最新 hf コマンド対応)
-# ---------------------------------------------------------
 def prepare_model():
     model_path = "./ni_v1_model"
     token = os.getenv("HF_TOKEN")
     if not os.path.exists(model_path):
         print("🚀 NI-v1 マージ開始...")
         env = os.environ.copy()
         if token:
             env["HF_TOKEN"] = token
-            # 2026年最新の hf コマンドを使用
             try:
                 subprocess.run(["hf", "auth", "login", "--token", token], check=True)
             except:
-                # 万が一 hf が入ってない場合でも、環境変数だけでマージを試みる
-                print("⚠️ hf auth login 失敗。環境変数のみで続行します。")
         try:
             subprocess.run(
-                ["mergekit-yaml", "config.yaml", model_path, "--allow-crimes"],
                 check=True,
                 env=env
             )
-            print("✨ マージ成功。")
         except:
-            raise RuntimeError("マージ失敗。設定を確認してくれ。")
     print("🧠 NI-v1 ロード中...")
     tokenizer = AutoTokenizer.from_pretrained(model_path, trust_remote_code=True)
@@ -44,7 +55,6 @@ def prepare_model():
     )
     return pipeline("text-generation", model=model, tokenizer=tokenizer)
-# 起動
 try:
     pipe = prepare_model()
 except Exception as e:
@@ -57,21 +67,16 @@ def predict(message, history):
     outputs = pipe(prompt, max_new_tokens=512, do_sample=True, temperature=0.7)
     return outputs[0]['generated_text'].split("assistant\n")[-1].replace("<|im_end|>", "")
-# ---------------------------------------------------------
-# 2. UI (Gradio バージョン差異を吸収)
-# ---------------------------------------------------------
 with gr.Blocks(title="NI-v1.0") as demo:
     gr.Markdown("# 🤖 Noppo-Intelligence v1.0")
     with gr.Tab("チャット"):
-        # TypeError 回避: type 引数を使わず、デフォルト設定で起動
         gr.ChatInterface(fn=predict)
     with gr.Tab("公開"):
-        gr.Markdown("### 完成した NI-v1 を Hugging Face にアップロード")
         repo_id = gr.Textbox(label="Repo ID", value="noppodev/NoppoIntelligence")
         user_token = gr.Textbox(label="Write Token", type="password")
-        pub_btn = gr.Button("アップロード開始")
         status = gr.Textbox(label="Status")
         def upload(r, t):

 import os
 import subprocess
+import shutil
 import gradio as gr
 from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
 import torch
 from huggingface_hub import HfApi
 def prepare_model():
     model_path = "./ni_v1_model"
+    # Hugging Faceのキャッシュディレクトリ（ここがパンクの元）
+    cache_path = os.path.expanduser("~/.cache/huggingface/hub")
     token = os.getenv("HF_TOKEN")
     if not os.path.exists(model_path):
+        print("🧹 ストレージ確保のため、古い残骸を掃除するぜ...")
+        # 以前のマージ失敗作があれば削除
+        if os.path.exists(model_path):
+            shutil.rmtree(model_path)
+        # もし容量がギリギリならキャッシュも消す（再ダウンロードになるけど背に腹は代えられない）
+        # shutil.rmtree(cache_path, ignore_errors=True)
         print("🚀 NI-v1 マージ開始...")
         env = os.environ.copy()
         if token:
             env["HF_TOKEN"] = token
             try:
                 subprocess.run(["hf", "auth", "login", "--token", token], check=True)
             except:
+                print("⚠️ ログインスキップ（環境変数で続行）")
         try:
+            # --lazy-unpickle: メモリとディスク消費を抑える魔法の引数
+            # --low-cpu-mem: さらに負荷を減らす
             subprocess.run(
+                ["mergekit-yaml", "config.yaml", model_path,
+                 "--allow-crimes",
+                 "--lazy-unpickle",
+                 "--low-cpu-mem"],
                 check=True,
                 env=env
             )
+            print("✨ マージ成功。のっぽ、耐えたぜ！")
         except:
+            raise RuntimeError("マージ失敗。容量か設定を見直してくれ。")
     print("🧠 NI-v1 ロード中...")
     tokenizer = AutoTokenizer.from_pretrained(model_path, trust_remote_code=True)
     )
     return pipeline("text-generation", model=model, tokenizer=tokenizer)
 try:
     pipe = prepare_model()
 except Exception as e:
     outputs = pipe(prompt, max_new_tokens=512, do_sample=True, temperature=0.7)
     return outputs[0]['generated_text'].split("assistant\n")[-1].replace("<|im_end|>", "")
 with gr.Blocks(title="NI-v1.0") as demo:
     gr.Markdown("# 🤖 Noppo-Intelligence v1.0")
     with gr.Tab("チャット"):
         gr.ChatInterface(fn=predict)
     with gr.Tab("公開"):
         repo_id = gr.Textbox(label="Repo ID", value="noppodev/NoppoIntelligence")
         user_token = gr.Textbox(label="Write Token", type="password")
+        pub_btn = gr.Button("アップロード")
         status = gr.Textbox(label="Status")
         def upload(r, t):