OpenGVLab
/

InternVideo2_5_Chat_8B

Video-Text-to-Text

feature-extraction

Eval Results (legacy)

Model card Files and versions

ynhe committed on Feb 18, 2025

Commit

bff14a1

·

verified ·

1 Parent(s): 6dd8f38

Update README.md

Files changed (1) hide show

README.md +1 -1

README.md CHANGED Viewed

@@ -117,7 +117,7 @@ from transformers import AutoModel, AutoTokenizer
 model_path = 'OpenGVLab/InternVideo2_5_Chat_8B'
 tokenizer = AutoTokenizer.from_pretrained(model_path, trust_remote_code=True)
-model = AutoModel.from_pretrained(model_path, trust_remote_code=True).half().cuda()
 IMAGENET_MEAN = (0.485, 0.456, 0.406)
 IMAGENET_STD = (0.229, 0.224, 0.225)

 model_path = 'OpenGVLab/InternVideo2_5_Chat_8B'
 tokenizer = AutoTokenizer.from_pretrained(model_path, trust_remote_code=True)
+model = AutoModel.from_pretrained(model_path, trust_remote_code=True).half().cuda().to(torch.bfloat16)
 IMAGENET_MEAN = (0.485, 0.456, 0.406)
 IMAGENET_STD = (0.229, 0.224, 0.225)