Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -54,7 +54,7 @@ def oai_error(message: str, code: str = "internal_error", status: int = 500):
|
|
| 54 |
# N_CTX=2048 (or 3072 if you can afford more latency)
|
| 55 |
# N_BATCH=512 or 1024 (try 1024 first)
|
| 56 |
N_THREADS = int(os.environ.get("N_THREADS", "2"))
|
| 57 |
-
N_CTX = int(os.environ.get("N_CTX", "…"))  [previous default truncated in this diff view]
|
| 58 |
N_BATCH = int(os.environ.get("N_BATCH", "1024"))
|
| 59 |
MAX_TOKENS_DEFAULT = int(os.environ.get("MAX_TOKENS_DEFAULT", "256"))
|
| 60 |
CTX_MARGIN = int(os.environ.get("CTX_MARGIN", "96"))
|
|
|
|
| 54 |
# N_CTX=2048 (or 3072 if you can afford more latency)
|
| 55 |
# N_BATCH=512 or 1024 (try 1024 first)
|
| 56 |
N_THREADS = int(os.environ.get("N_THREADS", "2"))
|
| 57 |
+
N_CTX = int(os.environ.get("N_CTX", "3072"))
|
| 58 |
N_BATCH = int(os.environ.get("N_BATCH", "1024"))
|
| 59 |
MAX_TOKENS_DEFAULT = int(os.environ.get("MAX_TOKENS_DEFAULT", "256"))
|
| 60 |
CTX_MARGIN = int(os.environ.get("CTX_MARGIN", "96"))
|