Commit: Update modeling_gpt2vision.py
Browse files
File changed: modeling_gpt2vision.py (+0 −2)
modeling_gpt2vision.py
CHANGED
|
@@ -67,7 +67,6 @@ class GPT2Vision(PreTrainedModel):
|
|
| 67 |
return_tensors="pt",
|
| 68 |
).to(device)
|
| 69 |
|
| 70 |
-
print("text_inputs",text_inputs)
|
| 71 |
# Adjust attention mask to account for image tokens and the extra <image> token
|
| 72 |
batch_size = text_inputs.input_ids.shape[0]
|
| 73 |
img_attention = torch.ones((batch_size, self.img_tokens + 1), dtype=torch.long, device=device)
|
|
@@ -100,7 +99,6 @@ class GPT2Vision(PreTrainedModel):
|
|
| 100 |
|
| 101 |
def generate(self, question, image, max_new_tokens=30, **kwargs):
|
| 102 |
prompt = f"\n\nQuestion:<image>{question}\n\nAnswer:"
|
| 103 |
-
print("prompt",prompt)
|
| 104 |
batch = {"image": [image], "text": prompt}
|
| 105 |
encoded_batch = self.tokenize_encode(batch, self.device)
|
| 106 |
inputs_embeds, attention_mask = self.preprocess_inputs(encoded_batch)
|
|
|
|
| 67 |
return_tensors="pt",
|
| 68 |
).to(device)
|
| 69 |
|
|
|
|
| 70 |
# Adjust attention mask to account for image tokens and the extra <image> token
|
| 71 |
batch_size = text_inputs.input_ids.shape[0]
|
| 72 |
img_attention = torch.ones((batch_size, self.img_tokens + 1), dtype=torch.long, device=device)
|
|
|
|
| 99 |
|
| 100 |
def generate(self, question, image, max_new_tokens=30, **kwargs):
|
| 101 |
prompt = f"\n\nQuestion:<image>{question}\n\nAnswer:"
|
|
|
|
| 102 |
batch = {"image": [image], "text": prompt}
|
| 103 |
encoded_batch = self.tokenize_encode(batch, self.device)
|
| 104 |
inputs_embeds, attention_mask = self.preprocess_inputs(encoded_batch)
|