Spaces:
Runtime error
Runtime error
Commit
·
784d667
1
Parent(s):
2598f17
Update app.py
Browse files
app.py
CHANGED
|
@@ -20,7 +20,7 @@ def init_args():
|
|
| 20 |
args.config_path = './config/llama_7b.json'
|
| 21 |
args.spm_model_path = './model_file/tokenizer.model'
|
| 22 |
args.batch_size = 1
|
| 23 |
-
args.seq_length =
|
| 24 |
args.world_size = 1
|
| 25 |
args.use_int8 = True
|
| 26 |
args.top_p = 0
|
|
@@ -42,9 +42,6 @@ def init_model():
|
|
| 42 |
model = load_model(model, args.load_model_path)
|
| 43 |
model.eval()
|
| 44 |
|
| 45 |
-
# for name, parameter in model.named_parameters():
|
| 46 |
-
# print(name)
|
| 47 |
-
# print(parameter)
|
| 48 |
print(torch.cuda.max_memory_allocated() / 1024 ** 3)
|
| 49 |
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
|
| 50 |
model.to(device)
|
|
|
|
| 20 |
args.config_path = './config/llama_7b.json'
|
| 21 |
args.spm_model_path = './model_file/tokenizer.model'
|
| 22 |
args.batch_size = 1
|
| 23 |
+
args.seq_length = 256
|
| 24 |
args.world_size = 1
|
| 25 |
args.use_int8 = True
|
| 26 |
args.top_p = 0
|
|
|
|
| 42 |
model = load_model(model, args.load_model_path)
|
| 43 |
model.eval()
|
| 44 |
|
|
|
|
|
|
|
|
|
|
| 45 |
print(torch.cuda.max_memory_allocated() / 1024 ** 3)
|
| 46 |
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
|
| 47 |
model.to(device)
|