update app

app.py CHANGED
@@ -116,7 +116,7 @@ css = """
 """
 
 MAX_MAX_NEW_TOKENS = 4096
-DEFAULT_MAX_NEW_TOKENS =
+DEFAULT_MAX_NEW_TOKENS = 1024
 MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
 
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
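The only change in this hunk is the new `DEFAULT_MAX_NEW_TOKENS = 1024`. The diff does not show how the constant is consumed, but in Gradio apps of this shape it typically seeds a generation-length slider capped by `MAX_MAX_NEW_TOKENS`; a minimal sketch of that assumed wiring (the slider itself is not part of this commit):

```python
import gradio as gr

MAX_MAX_NEW_TOKENS = 4096      # hard ceiling, from app.py
DEFAULT_MAX_NEW_TOKENS = 1024  # new default introduced by this commit

# Hypothetical wiring: app.py's actual UI layout is not visible in this diff.
max_new_tokens = gr.Slider(
    label="Max new tokens",
    minimum=1,
    maximum=MAX_MAX_NEW_TOKENS,
    step=1,
    value=DEFAULT_MAX_NEW_TOKENS,
)
```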
@@ -287,9 +287,7 @@ def generate_video(model_name: str, text: str, video_path: str,
 
     prompt_full = processor.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
     inputs = processor(
-        text=[prompt_full], images=images_for_processor, return_tensors="pt", padding=True,
-        truncation=True, max_length=MAX_INPUT_TOKEN_LENGTH
-    ).to(device)
+        text=[prompt_full], images=images_for_processor, return_tensors="pt", padding=True).to(device)
     streamer = TextIteratorStreamer(processor, skip_prompt=True, skip_special_tokens=True)
     generation_kwargs = {
         **inputs, "streamer": streamer, "max_new_tokens": max_new_tokens,
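Note the behavioral change in this hunk: with `truncation=True, max_length=MAX_INPUT_TOKEN_LENGTH` gone, the processor no longer clips long prompts, and `MAX_INPUT_TOKEN_LENGTH` is now unused at this call site. Dropping truncation may well be deliberate, since trimming token ids from a multimodal processor can sever image placeholder tokens from their pixel inputs. If a length guard is still wanted, a safer option is to warn rather than trim; a sketch under that assumption (not part of this commit):

```python
import gradio as gr

# Sketch only: warn instead of truncating, so multimodal placeholder tokens
# stay aligned with their pixel inputs. MAX_INPUT_TOKEN_LENGTH is app.py's
# existing constant; this guard is not part of the commit.
if inputs["input_ids"].shape[1] > MAX_INPUT_TOKEN_LENGTH:
    gr.Warning(
        f"Input is {inputs['input_ids'].shape[1]} tokens, over the "
        f"{MAX_INPUT_TOKEN_LENGTH}-token limit; output quality may degrade."
    )
```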
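The hunk ends midway through the `generation_kwargs` literal, so the rest of the dict is not visible here. For context, a `TextIteratorStreamer` built this way is normally drained by running `model.generate` on a worker thread and iterating the streamer on the main one; a minimal sketch of that standard transformers pattern (the thread and loop are not shown in this diff):

```python
from threading import Thread

def stream_generation(model, generation_kwargs, streamer):
    """Run generate() on a worker thread and yield the growing decoded text.
    Sketch of the usual TextIteratorStreamer pattern, not the app's exact code."""
    thread = Thread(target=model.generate, kwargs=generation_kwargs)
    thread.start()
    buffer = ""
    for new_text in streamer:  # blocks until the next decoded chunk arrives
        buffer += new_text
        yield buffer           # partial output, e.g. for a Gradio chat stream
    thread.join()
```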