Spaces:
Runtime error
Runtime error
Commit
·
492f975
1
Parent(s):
aed5af0
Update app.py
Browse files
app.py
CHANGED
|
@@ -7,6 +7,8 @@ from models.tokenize import Tokenizer
|
|
| 7 |
from models.llama import *
|
| 8 |
from generate import LmGeneration
|
| 9 |
|
|
|
|
|
|
|
| 10 |
|
| 11 |
args = None
|
| 12 |
lm_generation = None
|
|
@@ -22,7 +24,7 @@ def init_args():
|
|
| 22 |
args.batch_size = 1
|
| 23 |
args.seq_length = 512
|
| 24 |
args.world_size = 1
|
| 25 |
-
args.use_int8 = True
|
| 26 |
args.top_p = 0
|
| 27 |
args.repetition_penalty_range = 1024
|
| 28 |
args.repetition_penalty_slope = 0
|
|
|
|
| 7 |
from models.llama import *
|
| 8 |
from generate import LmGeneration
|
| 9 |
|
| 10 |
+
import os
|
| 11 |
+
os.environ['CUDA_LAUNCH_BLOCKING'] = '1'
|
| 12 |
|
| 13 |
args = None
|
| 14 |
lm_generation = None
|
|
|
|
| 24 |
args.batch_size = 1
|
| 25 |
args.seq_length = 512
|
| 26 |
args.world_size = 1
|
| 27 |
+
args.use_int8 = False
|
| 28 |
args.top_p = 0
|
| 29 |
args.repetition_penalty_range = 1024
|
| 30 |
args.repetition_penalty_slope = 0
|