Update modeling_minicpmv.py
Browse files — modeling_minicpmv.py (+10, −1)
modeling_minicpmv.py
CHANGED
|
@@ -272,7 +272,16 @@ class MiniCPMV(MiniCPMVPreTrainedModel):
|
|
| 272 |
counter += 1
|
| 273 |
batch.append(input_embeds)
|
| 274 |
|
| 275 |
-
batch = torch.cat(batch, dim=0)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 276 |
# output_ids = self._decode(input_embeds, tokenizer, **kwargs)
|
| 277 |
if stream:
|
| 278 |
kwargs.pop("decode_text")
|
|
|
|
| 272 |
counter += 1
|
| 273 |
batch.append(input_embeds)
|
| 274 |
|
| 275 |
+
# batch = torch.cat(batch, dim=0)
|
| 276 |
+
# pad_sequence(embeddings_list, batch_first=True, padding_value=0.0)
|
| 277 |
+
max_length = max(tensor.shape[1] for tensor in batch)
|
| 278 |
+
|
| 279 |
+
# Step 2: Zero-pad each tensor at the end of its last dimension up to max_length (F.pad pads with 0 by default)
|
| 280 |
+
padded_tensors = [torch.nn.functional.pad(tensor, (0, max_length - tensor.shape[1])) for tensor in batch]
|
| 281 |
+
|
| 282 |
+
# Step 3: Concatenate the padded tensors along dim 0 into a single batch
|
| 283 |
+
batch = torch.cat(padded_tensors, dim=0)
|
| 284 |
+
|
| 285 |
# output_ids = self._decode(input_embeds, tokenizer, **kwargs)
|
| 286 |
if stream:
|
| 287 |
kwargs.pop("decode_text")
|