Spaces:

arcee-ai
/

arcee-model-testing

Sleeping

Mark-Arcee committed on Apr 1, 2024

Commit

9dc82d4

verified ·

1 Parent(s): 38d64e4

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -14,8 +14,8 @@ DESCRIPTION = "# Arcee Model Testing - current test: arcee-ai/SEC-Calme-7B-Instr
 if not torch.cuda.is_available():
     DESCRIPTION += "\n<p>Running on CPU 🥶 This demo does not work on CPU.</p>"
-MAX_MAX_NEW_TOKENS = 2048
-DEFAULT_MAX_NEW_TOKENS = 1024
 MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
 if torch.cuda.is_available():
@@ -28,7 +28,7 @@ if torch.cuda.is_available():
 def generate(
     message: str,
     chat_history: list[tuple[str, str]],
-    max_new_tokens: int = 1024,
     temperature: float = 0.6,
     top_p: float = 0.9,
     top_k: int = 50,

 if not torch.cuda.is_available():
     DESCRIPTION += "\n<p>Running on CPU 🥶 This demo does not work on CPU.</p>"
+MAX_MAX_NEW_TOKENS = 4096
+DEFAULT_MAX_NEW_TOKENS = 4096
 MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
 if torch.cuda.is_available():
 def generate(
     message: str,
     chat_history: list[tuple[str, str]],
+    max_new_tokens: int = 4096,
     temperature: float = 0.6,
     top_p: float = 0.9,
     top_k: int = 50,