Spaces:
Runtime error
Update agent.py
Browse files
agent.py
CHANGED
|
@@ -161,10 +161,10 @@ try:
|
|
| 161 |
logger.info(f"Используемое устройство: {device}")
|
| 162 |
|
| 163 |
# Инициализация Qwen2-7B
|
| 164 |
-
qwen_tokenizer = AutoTokenizer.from_pretrained("Qwen/Qwen2-1.5B-Instruct")
|
| 165 |
qwen_model = AutoModelForCausalLM.from_pretrained(
|
| 166 |
-
|
| 167 |
-
"Qwen/Qwen2-1.5B-Instruct",
|
| 168 |
device_map="auto",
|
| 169 |
load_in_4bit=True if device == "cuda" else False, # Квантование для GPU
|
| 170 |
torch_dtype=torch.float16 if device == "cuda" else torch.float32
|
|
@@ -880,8 +880,8 @@ def create_answer(state: AgentState) -> AgentState:
|
|
| 880 |
logger.info(f"Используемое устройство: {device}")
|
| 881 |
qwen_tokenizer = AutoTokenizer.from_pretrained("Qwen/Qwen2-7B-Instruct")
|
| 882 |
qwen_model = AutoModelForCausalLM.from_pretrained(
|
| 883 |
-
|
| 884 |
-
"Qwen/Qwen2-1.5B-Instruct",
|
| 885 |
device_map="auto",
|
| 886 |
torch_dtype=torch.bfloat16, # Используем bfloat16 для экономии памяти
|
| 887 |
low_cpu_mem_usage=True # Оптимизация для CPU
|
|
|
|
| 161 |
logger.info(f"Используемое устройство: {device}")
|
| 162 |
|
| 163 |
# Инициализация Qwen2-7B
|
| 164 |
+
qwen_tokenizer = AutoTokenizer.from_pretrained("Qwen/Qwen2-7B-Instruct") # ("Qwen/Qwen2-1.5B-Instruct")
|
| 165 |
qwen_model = AutoModelForCausalLM.from_pretrained(
|
| 166 |
+
"Qwen/Qwen2-7B-Instruct",
|
| 167 |
+
# "Qwen/Qwen2-1.5B-Instruct",
|
| 168 |
device_map="auto",
|
| 169 |
load_in_4bit=True if device == "cuda" else False, # Квантование для GPU
|
| 170 |
torch_dtype=torch.float16 if device == "cuda" else torch.float32
|
|
|
|
| 880 |
logger.info(f"Используемое устройство: {device}")
|
| 881 |
qwen_tokenizer = AutoTokenizer.from_pretrained("Qwen/Qwen2-7B-Instruct")
|
| 882 |
qwen_model = AutoModelForCausalLM.from_pretrained(
|
| 883 |
+
"Qwen/Qwen2-7B-Instruct",
|
| 884 |
+
# "Qwen/Qwen2-1.5B-Instruct",
|
| 885 |
device_map="auto",
|
| 886 |
torch_dtype=torch.bfloat16, # Используем bfloat16 для экономии памяти
|
| 887 |
low_cpu_mem_usage=True # Оптимизация для CPU
|