valentinfrlch committed on
Commit
b4f2de0
·
verified ·
1 Parent(s): 2653ad0

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +2 -35
README.md CHANGED
@@ -13,14 +13,6 @@ tags:
13
  - on-device
14
  language:
15
  - en
16
- - de
17
- - nl
18
- - fr
19
- - es
20
- - pt
21
- - it
22
- - pl
23
- - sv
24
  extra_gated_heading: Access Glimpse-v1
25
  extra_gated_description: >-
26
  Glimpse-v1 is a Model Derivative of Google's Gemma and is distributed under
@@ -84,7 +76,7 @@ Glimpse-v1 reports a **1.9× accuracy improvement** over the base Gemma 3 4B mod
84
 
85
  ## Training
86
 
87
- - **Base:** Gemma 3 4B (instruction-tuned)
88
  - **Data:** ~5,000 curated real-world home security camera events spanning diverse scenes, lighting conditions, and event types
89
  - **Objective:** Supervised fine-tuning for concise, factual event descriptions
90
 
@@ -101,45 +93,26 @@ ollama run llmvision/glimpse-v1
101
 
102
  ### Transformers
103
  ```
104
-
105
  from transformers import AutoProcessor, AutoModelForImageTextToText
106
-
107
  import torch
108
-
109
- model_id = "<your-hf-username>/glimpse-v1"
110
-
111
  processor = AutoProcessor.from_pretrained(model_id)
112
-
113
  model = AutoModelForImageTextToText.from_pretrained(
114
-
115
  model_id, torch_dtype=torch.bfloat16, device_map="auto"
116
-
117
  )
118
 
119
  messages = [
120
-
121
  {"role": "user", "content": [
122
-
123
  {"type": "image", "url": "path/to/frame.jpg"},
124
-
125
  {"type": "text", "text": "Summarize this camera event in one sentence."},
126
-
127
  ]},
128
-
129
  ]
130
-
131
  inputs = processor.apply_chat_template(
132
-
133
  messages, add_generation_prompt=True, tokenize=True,
134
-
135
  return_dict=True, return_tensors="pt",
136
-
137
  ).to(model.device)
138
-
139
  out = model.generate(**inputs, max_new_tokens=128)
140
-
141
  print(processor.decode(out[0], skip_special_tokens=True))
142
-
143
  ```
144
 
145
  ## Limitations and risks
@@ -164,17 +137,11 @@ By downloading or using Glimpse-v1 you agree to the Gemma Terms of Use. If you r
164
  ## Citation
165
 
166
  ```
167
-
168
  @misc{glimpse_v1_2026,
169
-
170
  title = {Glimpse-v1: A compact vision-language model for home security event understanding},
171
-
172
  author = {LLM Vision},
173
-
174
  year = {2026},
175
-
176
  url = {https://llmvision.org/glimpse/}
177
-
178
  }
179
 
180
  ```
 
13
  - on-device
14
  language:
15
  - en
 
 
 
 
 
 
 
 
16
  extra_gated_heading: Access Glimpse-v1
17
  extra_gated_description: >-
18
  Glimpse-v1 is a Model Derivative of Google's Gemma and is distributed under
 
76
 
77
  ## Training
78
 
79
+ - **Base:** Gemma 3 4B
80
  - **Data:** ~5,000 curated real-world home security camera events spanning diverse scenes, lighting conditions, and event types
81
  - **Objective:** Supervised fine-tuning for concise, factual event descriptions
82
 
 
93
 
94
  ### Transformers
95
  ```
 
96
  from transformers import AutoProcessor, AutoModelForImageTextToText
 
97
  import torch
98
+ model_id = "llmvision/glimpse-v1"
 
 
99
  processor = AutoProcessor.from_pretrained(model_id)
 
100
  model = AutoModelForImageTextToText.from_pretrained(
 
101
  model_id, torch_dtype=torch.bfloat16, device_map="auto"
 
102
  )
103
 
104
  messages = [
 
105
  {"role": "user", "content": [
 
106
  {"type": "image", "url": "path/to/frame.jpg"},
 
107
  {"type": "text", "text": "Summarize this camera event in one sentence."},
 
108
  ]},
 
109
  ]
 
110
  inputs = processor.apply_chat_template(
 
111
  messages, add_generation_prompt=True, tokenize=True,
 
112
  return_dict=True, return_tensors="pt",
 
113
  ).to(model.device)
 
114
  out = model.generate(**inputs, max_new_tokens=128)
 
115
  print(processor.decode(out[0], skip_special_tokens=True))
 
116
  ```
117
 
118
  ## Limitations and risks
 
137
  ## Citation
138
 
139
  ```
 
140
  @misc{glimpse_v1_2026,
 
141
  title = {Glimpse-v1: A compact vision-language model for home security event understanding},
 
142
  author = {LLM Vision},
 
143
  year = {2026},
 
144
  url = {https://llmvision.org/glimpse/}
 
145
  }
146
 
147
  ```