Spaces:
Runtime error
Runtime error
ffreemt
committed on
Commit
·
56ad8d6
1
Parent(s):
5f4757d
Back to Qwen/Qwen-7B-Chat
Browse files
app.py
CHANGED
|
@@ -60,8 +60,8 @@ except Exception:
|
|
| 60 |
# Windows
|
| 61 |
logger.warning("Windows, cant run time.tzset()")
|
| 62 |
|
| 63 |
-
model_name = "Qwen/Qwen-7B-Chat" # gone!
|
| 64 |
model_name = "tangger/Qwen-7B-Chat" # try
|
|
|
|
| 65 |
tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
|
| 66 |
|
| 67 |
n_gpus = torch.cuda.device_count()
|
|
@@ -82,7 +82,8 @@ def gen_model(model_name: str):
|
|
| 82 |
model_name,
|
| 83 |
trust_remote_code=True,
|
| 84 |
device_map="auto",
|
| 85 |
-
load_in_4bit=True,
|
|
|
|
| 86 |
max_memory=max_memory,
|
| 87 |
fp16=True,
|
| 88 |
torch_dtype=torch.float16,
|
|
|
|
| 60 |
# Windows
|
| 61 |
logger.warning("Windows, cant run time.tzset()")
|
| 62 |
|
|
|
|
| 63 |
model_name = "tangger/Qwen-7B-Chat" # try
|
| 64 |
+
model_name = "Qwen/Qwen-7B-Chat" # gone!
|
| 65 |
tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
|
| 66 |
|
| 67 |
n_gpus = torch.cuda.device_count()
|
|
|
|
| 82 |
model_name,
|
| 83 |
trust_remote_code=True,
|
| 84 |
device_map="auto",
|
| 85 |
+
# load_in_4bit=True,
|
| 86 |
+
load_in_8bit=True,
|
| 87 |
max_memory=max_memory,
|
| 88 |
fp16=True,
|
| 89 |
torch_dtype=torch.float16,
|