Spaces:

noppodev
/

NoppoIntelligence

Sleeping

App Files Files Community

noppodev committed on Apr 12

Commit

1c327ab

verified ·

1 Parent(s): 9beded6

Update app.py

Browse files

Files changed (1) hide show

app.py +46 -99

app.py CHANGED Viewed

@@ -2,115 +2,62 @@ import os
 import subprocess
 import shutil
 import gradio as gr
-from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline, BitsAndBytesConfig
-import torch
 from huggingface_hub import HfApi
-# ---------------------------------------------------------
-# 1. モデル準備セクション (ストレージ清掃 + 認証 + マージ)
-# ---------------------------------------------------------
-def prepare_model():
-    model_path = "./ni_v1_model"
-    token = os.getenv("HF_TOKEN")
-    if not os.path.exists(model_path):
-        print("🧹 ストレージ確保のため、古い残骸を掃除するぜ...")
         if os.path.exists(model_path):
             shutil.rmtree(model_path)
-        print("🚀 NI-v1 マージ開始...")
-        env = os.environ.copy()
-        if token:
-            env["HF_TOKEN"] = token
-            # 2026年最新の hf コマンドで認証
-            try:
-                subprocess.run(["hf", "auth", "login", "--token", token], check=True)
-            except:
-                print("⚠️ 認証コマンド失敗。環境変数のみで続行するぜ。")
-        try:
-            # ストレージとメモリを節約するオプション付きでマージ実行
-            subprocess.run(
-                ["mergekit-yaml", "config.yaml", model_path,
-                 "--allow-crimes",
-                 "--lazy-unpickle",
-                 "--low-cpu-mem"],
-                check=True,
-                env=env
-            )
-            print("✨ マージ成功。のっぽ、やったぜ！")
-        except:
-            raise RuntimeError("マージ失敗。config.yaml のレイヤー数を減らしてくれ。")
-    print("🧠 NI-v1 ロード中 (4-bit 量子化でメモリ節約モード)...")
-    # メモリ不足対策の量子化設定
-    bnb_config = BitsAndBytesConfig(
-        load_in_4bit=True,
-        bnb_4bit_compute_dtype=torch.bfloat16,
-        bnb_4bit_quant_type="nf4",
-        bnb_4bit_use_double_quant=True,
-    )
-    tokenizer = AutoTokenizer.from_pretrained(model_path, trust_remote_code=True)
-    model = AutoModelForCausalLM.from_pretrained(
-        model_path,
-        quantization_config=bnb_config, # ここでメモリを大幅節約
-        device_map="auto",
-        trust_remote_code=True
-    )
-    return pipeline("text-generation", model=model, tokenizer=tokenizer)
-# ユニット起動
-try:
-    pipe = prepare_model()
-except Exception as e:
-    print(f"起動失敗: {e}")
-    pipe = None
-# ---------------------------------------------------------
-# 2. 推論ロジック
-# ---------------------------------------------------------
-def predict(message, history):
-    if pipe is None:
-        return "知能ユニットが起動してないぜ。容量不足かロードエラーだ。"
-    # ユーザー指定のプロンプト形式
-    prompt = f"<|im_start|>user\n{message}<|im_end|>\n<|im_start|>assistant\n"
-    outputs = pipe(prompt, max_new_tokens=512, do_sample=True, temperature=0.7)
-    # 応答部分を抽出
-    response = outputs[0]['generated_text'].split("assistant\n")[-1].replace("<|im_end|>", "")
-    return response
-# ---------------------------------------------------------
-# 3. UIセクション (ChatInterfaceで送信エラーを物理的に防ぐ)
-# ---------------------------------------------------------
-with gr.Blocks(title="NI-v1.0") as demo:
-    gr.Markdown("# 🤖 Noppo-Intelligence v1.0")
-    with gr.Tab("チャット"):
-        # 履歴管理をGradioに任せるのが、送信エラーを回避する一番の近道だ
-        gr.ChatInterface(fn=predict)
-    with gr.Tab("公開"):
-        gr.Markdown("### 完成した NI-v1 を Hugging Face にアップロード")
-        # リポジトリ名はのっぽ指定のもの
-        repo_id = gr.Textbox(label="Repo ID", value="noppodev/NoppoIntelligence")
-        user_token = gr.Textbox(label="Write Token (HF_TOKEN)", type="password")
-        pub_btn = gr.Button("アップロード開始")
-        status = gr.Textbox(label="Status")
-        def upload(r, t):
-            try:
-                api = HfApi()
-                api.create_repo(repo_id=r, repo_type="model", exist_ok=True)
-                api.upload_folder(folder_path="./ni_v1_model", repo_id=r, token=t)
-                return "✅ アップロード完了！BeyondIntelligenceへの第一歩だ。"
-            except Exception as e:
-                return f"❌ エラー発生: {e}"
-        pub_btn.click(upload, [repo_id, user_token], status)
 if __name__ == "__main__":
     demo.launch(server_name="0.0.0.0", server_port=7860)

 import subprocess
 import shutil
 import gradio as gr
 from huggingface_hub import HfApi
+# 1. 処理ロジック
+def run_factory(repo_id, token):
+    if not repo_id or not token:
+        return "❌ Repo IDとTokenを入れてくれ！"
+    model_path = "./ni_v1_model"
+    env = os.environ.copy()
+    env["HF_TOKEN"] = token
+    try:
+        # 古い残骸を掃除
         if os.path.exists(model_path):
             shutil.rmtree(model_path)
+        # 認証
+        print("🚀 認証中...")
+        subprocess.run(["hf", "auth", "login", "--token", token], check=True)
+        # マージ実行 (lazy-unpickleでメモリ節約)
+        print("🚀 マージ開始...")
+        subprocess.run(
+            ["mergekit-yaml", "config.yaml", model_path,
+             "--allow-crimes", "--lazy-unpickle", "--low-cpu-mem"],
+            check=True, env=env
+        )
+        # アップロード実行
+        print("🚀 アップロード開始...")
+        api = HfApi()
+        api.create_repo(repo_id=repo_id, repo_type="model", exist_ok=True)
+        api.upload_folder(
+            folder_path=model_path,
+            repo_id=repo_id,
+            token=token,
+            commit_message="NI-v1.0 generated by NoppoStudio Factory"
+        )
+        return f"✅ 成功だぜ！\nリポジトリ: https://huggingface.co/{repo_id}\n今すぐColabで動かそうぜ！"
+    except Exception as e:
+        return f"❌ エラー発生: {str(e)}"
+# 2. UI
+with gr.Blocks(title="NI-v1 Factory") as demo:
+    gr.Markdown("# 🏭 Noppo-Intelligence v1.0 Factory")
+    gr.Markdown("Spaces(CPU)でマージだけ行い、完成品をリポジトリへ自動転送するぜ。")
+    with gr.Column():
+        repo = gr.Textbox(label="転送先 Repo ID", value="noppodev/NoppoIntelligence")
+        token = gr.Textbox(label="Hugging Face Write Token", type="password")
+        start_btn = gr.Button("マージ＆アップロード開始", variant="primary")
+        output = gr.Textbox(label="ログ / 結果", interactive=False)
+    start_btn.click(run_factory, [repo, token], output)
 if __name__ == "__main__":
     demo.launch(server_name="0.0.0.0", server_port=7860)