Spaces:

AxisCommunity
/

OrionPax

Runtime error

App Files Files Community

AxisCommunity committed on 10 days ago

Commit

ef63875

verified ·

1 Parent(s): cc2e612

Update app.py

Browse files

Files changed (1) hide show

app.py +11 -27

app.py CHANGED Viewed

@@ -1,36 +1,20 @@
-import os
 import gradio as gr
 from transformers import LlamaForCausalLM, LlamaTokenizer
-from huggingface_hub import hf_hub_download
 import torch
-model_id = "AxisCommunity/OrionZetAI_1.0V"
-print("Загрузка токенизатора...")
 tokenizer = LlamaTokenizer.from_pretrained(model_id)
-print("Проверка файлов модели OrionPax в облаке...")
-config_path = hf_hub_download(repo_id=model_id, filename="config.json")
-local_dir = os.path.dirname(config_path)
-# Проверяем файлы весов и делаем линк
-possible_files = ["orion_model.safetensors", "model.safetensors"]
-for f in possible_files:
-    try:
-        weight_path = hf_hub_download(repo_id=model_id, filename=f)
-        standard_path = os.path.join(local_dir, "model.safetensors")
-        if weight_path != standard_path and not os.path.exists(standard_path):
-            print(f"Создаем линк для {f} -> model.safetensors")
-            os.symlink(weight_path, standard_path)
-        break
-    except Exception:
-        continue
-print("Загрузка OrionPax в память сервера...")
 model = LlamaForCausalLM.from_pretrained(
-    local_dir,
     torch_dtype=torch.float16,
-    device_map="auto"
 )
 def generate(text):
@@ -42,19 +26,19 @@ def generate(text):
     with torch.no_grad():
         output = model.generate(
             **inputs,
-            max_new_tokens=150,
             temperature=0.7,
             do_sample=True
         )
     return tokenizer.decode(output[0], skip_special_tokens=True)
-# Интерфейс Gradio с новым крутым названием!
 demo = gr.Interface(
     fn=generate,
     inputs=gr.Textbox(lines=3, placeholder="Напиши что-нибудь OrionPax..."),
     outputs="text",
-    title="OrionPax AI Cloud 1.0V"  # <-- Твое новое имя проекта!
 )
 demo.launch()

 import gradio as gr
 from transformers import LlamaForCausalLM, LlamaTokenizer
 import torch
+# Указываем твое новое правильное имя репозитория моделей
+model_id = "AxisCommunity/OrionPaxAI_1.0V"
+print("Загрузка токенизатора для OrionPax...")
 tokenizer = LlamaTokenizer.from_pretrained(model_id)
+print("Загрузка весов OrionPax (включаем экономию ОЗУ)...")
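+# NOTE(review): from_pretrained resolves standard weight filenames (e.g. model.safetensors); a file named orion_model.safetensors is probably NOT found automatically, even if it is the only weights file in the repo — verify, or rename the file in the model repo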
 model = LlamaForCausalLM.from_pretrained(
+    model_id,
     torch_dtype=torch.float16,
+    low_cpu_mem_usage=True,  # Это спасет бесплатный сервер от зависания памяти!
+    device_map="auto"        # Автоматическое распределение
 )
 def generate(text):
     with torch.no_grad():
         output = model.generate(
             **inputs,
+            max_new_tokens=100,  # Оптимально для быстрой генерации в облаке
             temperature=0.7,
             do_sample=True
         )
     return tokenizer.decode(output[0], skip_special_tokens=True)
+# Интерфейс Gradio
 demo = gr.Interface(
     fn=generate,
     inputs=gr.Textbox(lines=3, placeholder="Напиши что-нибудь OrionPax..."),
     outputs="text",
+    title="OrionPax AI Cloud 1.0V"
 )
 demo.launch()