English
naveensp commited on
Commit
43e609b
·
verified ·
1 Parent(s): 4e9d1c9

Delete llava_olmo_explore.py with huggingface_hub

Browse files
Files changed (1) hide show
  1. llava_olmo_explore.py +0 -51
llava_olmo_explore.py DELETED
@@ -1,51 +0,0 @@
1
- import torch
2
- import sys
3
- from OLMo_Bitnet_1B.model import OLMo
4
- from OLMo_Bitnet_1B.config import ModelConfig
5
- from OLMo_Bitnet_1B.configuration_olmo import OLMoConfig
6
- from OLMo_Bitnet_1B.modeling_olmo import OLMoForCausalLM
7
- import json
8
- from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline, TextStreamer
9
- import llava.model.language_model.llava_olmo1p58b as llava_olmo
10
- import PIL
11
- import torchvision
12
-
13
- device = torch.device('cuda:5' if torch.cuda.is_available() else 'cpu')
14
- torch.manual_seed(42)
15
-
16
- with open('llava/config.json') as json_file:
17
- data = json.load(json_file)
18
- config_class = llava_olmo.LlavaOLMoBitnet1BConfig(**data)
19
-
20
- # config_class = OLMoConfig(**data)
21
- model = OLMoForCausalLM(config_class).to(device)
22
- model.load_state_dict(torch.load('OLMo_Bitnet_1B/pytorch_model.bin'))
23
-
24
- model.eval()
25
-
26
- # tokenizer = AutoTokenizer.from_pretrained("NousResearch/OLMo-Bitnet-1B")
27
-
28
- tokenizer = AutoTokenizer.from_pretrained(
29
- "NousResearch/OLMo-Bitnet-1B",
30
- cache_dir="./cache/",
31
- model_max_length=1024,
32
- padding_side="right",
33
- pad_token_id=1,
34
- unk_token='<|padding|>',
35
- )
36
-
37
- text = "Paris is a historic city with architectural marvels. It is also "
38
-
39
-
40
- inputs = tokenizer(text, return_tensors='pt', return_token_type_ids=False).to(device)
41
-
42
- # response = model.generate(**inputs, max_new_tokens=100, do_sample=True, top_k=50, top_p=0.95)
43
-
44
-
45
- # llava olmo setup
46
- image_tensor = torchvision.io.read_image('playground/data/LLaVA-Pretrain/images/00316/003163402.jpg')
47
- lolmo = llava_olmo.LlavaOLMoBitnet1BForCausalLM(config_class).to(device)
48
- lolmo.load_state_dict(torch.load('OLMo_Bitnet_1B/pytorch_model.bin'), strict=False)
49
- response = lolmo.generate(inputs=inputs['input_ids'], max_new_tokens=100, do_sample=True, top_k=50, top_p=0.95)
50
-
51
- print(tokenizer.batch_decode(response, skip_special_tokens=True)[0])