Update main.py
Browse files
main.py
CHANGED
|
@@ -28,13 +28,13 @@ MODEL_ID = os.getenv("MODEL_ID", "")
|
|
| 28 |
|
| 29 |
DEFAULT_TEMP = float(os.getenv("DEFAULT_TEMPERATURE", "0.6"))
|
| 30 |
DEFAULT_TOP_P = float(os.getenv("DEFAULT_TOP_P", "0.95"))
|
| 31 |
-
DEFAULT_TOKENS = int(os.getenv("DEFAULT_MAX_TOKENS", "
|
| 32 |
|
| 33 |
REQUEST_TIMEOUT = int(os.getenv("REQUEST_TIMEOUT", "120"))
|
| 34 |
MAX_RETRIES = int(os.getenv("MAX_RETRIES", "3"))
|
| 35 |
RETRY_BASE_DELAY = float(os.getenv("RETRY_BASE_DELAY", "1.5"))
|
| 36 |
|
| 37 |
-
MAX_INPUT_TOKENS =
|
| 38 |
|
| 39 |
# przybliżone przeliczenie: 1 token ~ 4 znaki
|
| 40 |
AVG_CHARS_PER_TOKEN = 4
|
|
|
|
| 28 |
|
| 29 |
DEFAULT_TEMP = float(os.getenv("DEFAULT_TEMPERATURE", "0.6"))
|
| 30 |
DEFAULT_TOP_P = float(os.getenv("DEFAULT_TOP_P", "0.95"))
|
| 31 |
+
DEFAULT_TOKENS = int(os.getenv("DEFAULT_MAX_TOKENS", "16000"))
|
| 32 |
|
| 33 |
REQUEST_TIMEOUT = int(os.getenv("REQUEST_TIMEOUT", "120"))
|
| 34 |
MAX_RETRIES = int(os.getenv("MAX_RETRIES", "3"))
|
| 35 |
RETRY_BASE_DELAY = float(os.getenv("RETRY_BASE_DELAY", "1.5"))
|
| 36 |
|
| 37 |
+
MAX_INPUT_TOKENS = 16000 # stała wartość
|
| 38 |
|
| 39 |
# przybliżone przeliczenie: 1 token ~ 4 znaki
|
| 40 |
AVG_CHARS_PER_TOKEN = 4
|