2.0.0
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- console.log +53 -0
- devkit/precision.json +71 -71
- devkit/vlm_config.json +1 -0
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token0_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token1024_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token1152_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token1280_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token128_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token1408_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token1536_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token1664_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token1792_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token1920_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token256_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token384_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token512_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token640_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token768_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token896_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer0_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer10_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer11_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer12_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer13_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer14_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer15_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer16_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer17_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer18_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer19_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer1_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer20_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer21_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer22_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer23_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer24_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer25_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer26_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer2_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer3_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer4_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer5_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer6_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer7_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer8_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer9_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_pre_layer0_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_pre_layer10_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_pre_layer11_stage1_mla.elf +2 -2
- elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_pre_layer12_stage1_mla.elf +2 -2
console.log
ADDED
|
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
None of PyTorch, TensorFlow >= 2.0, or Flax have been found. Models won't be available and only tokenizers, configuration and file/data utilities can be used.
|
| 2 |
+
None of PyTorch, TensorFlow >= 2.0, or Flax have been found. Models won't be available and only tokenizers, configuration and file/data utilities can be used.
|
| 3 |
+
VLM initialization starting ...
|
| 4 |
+
VLM initialization completed.
|
| 5 |
+
>>> Query: Why is the sky blue?
|
| 6 |
+
Assistant: The sky appears blue because of a phenomenon called Rayleigh scattering, named after the British physicist Lord Rayleigh, who first explained it in the late 19th century.
|
| 7 |
+
|
| 8 |
+
Here's what happens:
|
| 9 |
+
|
| 10 |
+
1. **Sunlight enters Earth's atmosphere**: When sunlight enters our atmosphere, it encounters tiny molecules of gases like nitrogen (N2) and oxygen (O2).
|
| 11 |
+
2. **Scattering occurs**: These gas molecules scatter the light in all directions, but they scatter shorter (blue) wavelengths more than longer (red) wavelengths. This is known as Rayleigh scattering.
|
| 12 |
+
3. **Blue light is scattered**: As a result, the blue light is scattered in all directions, making the sky appear blue to our eyes.
|
| 13 |
+
4. **Red light continues to travel**: The longer wavelengths of light, like red and orange, continue to travel in a straight line, reaching our eyes from a more direct path.
|
| 14 |
+
|
| 15 |
+
This is why the sky typically appears blue during the daytime, especially during clear weather. At sunrise and sunset, the light has to travel through more of the atmosphere, which scatters the shorter wavelengths even more, making the sky appear more red or orange.
|
| 16 |
+
|
| 17 |
+
It's worth noting that the color of the sky can vary depending on atmospheric conditions, like pollution, dust, and water vapor. For example, during a severe thunderstorm or in areas with high levels of pollution, the sky can appear more gray or hazy.
|
| 18 |
+
|
| 19 |
+
So, to summarize, the sky appears blue due to the scattering of sunlight by tiny molecules in the atmosphere, which scatters shorter wavelengths (like blue light) more than longer wavelengths (like red light).
|
| 20 |
+
|
| 21 |
+
Number of generated tokens: 327
|
| 22 |
+
TTFT: 0.21s
|
| 23 |
+
TPS: avg=19.64, quantiles=['20.03', '19.63', '19.58', '19.35']
|
| 24 |
+
>>> Query: Summarize
|
| 25 |
+
Assistant: The sky appears blue due to Rayleigh scattering, where tiny molecules in the atmosphere scatter sunlight, scattering shorter (blue) wavelengths more than longer (red) wavelengths. This scattering occurs when sunlight enters the Earth's atmosphere and encounters gas molecules like nitrogen and oxygen. As a result, blue light is scattered in all directions, making the sky appear blue to our eyes.
|
| 26 |
+
|
| 27 |
+
Number of generated tokens: 74
|
| 28 |
+
TTFT: 0.13s
|
| 29 |
+
TPS: avg=19.10, quantiles=['19.12', '19.10', '19.08', '19.07']
|
| 30 |
+
>>> Query: Tell me a story based on this
|
| 31 |
+
Assistant: Once upon a time, in a small village nestled between two great mountains, there lived a young girl named Luna. Luna was fascinated by the sky and spent most of her days gazing up at it, trying to understand its secrets.
|
| 32 |
+
|
| 33 |
+
One day, while exploring the village, Luna stumbled upon an old wise man named Atlas. Atlas was a master of the stars and the secrets of the universe. He had spent his life studying the movements of the planets and the behavior of light.
|
| 34 |
+
|
| 35 |
+
Luna approached Atlas with a curious mind and a burning question: "Why is the sky blue?" Atlas smiled and began to tell her a story.
|
| 36 |
+
|
| 37 |
+
"Long ago," Atlas said, "the sky was not blue. It was a deep, fiery red, like the embers of a dying fire. But one day, a great storm swept through the land, bringing with it tiny particles of dust and gas. These particles danced in the air, scattering the light of the sun in all directions."
|
| 38 |
+
|
| 39 |
+
Luna's eyes widened with wonder as Atlas continued. "The blue light, being the shortest and most energetic of all, was scattered the most. It bounced off the particles and filled the air with a brilliant blue hue. And so, the sky became blue, a reflection of the beauty and wonder of the universe."
|
| 40 |
+
|
| 41 |
+
Luna listened, entranced, as Atlas told her of the ancient Greeks who had first discovered the secret of the blue sky. She learned of the great scientists who had studied the behavior of light and the tiny molecules that scattered it.
|
| 42 |
+
|
| 43 |
+
As the sun began to set, casting a warm orange glow over the village, Luna looked up at the sky and saw the blue hue for the first time. She felt a sense of wonder and awe, knowing that the sky was not just a simple reflection of the sun's light, but a complex and beautiful dance of particles and light.
|
| 44 |
+
|
| 45 |
+
From that day on, Luna spent every clear night gazing up at the sky, searching for the secrets of the universe and the magic of the blue light that made it all possible. And Atlas, the wise old man, watched over her, guiding her on her journey of discovery and wonder.
|
| 46 |
+
|
| 47 |
+
The story of the blue sky became a legend, passed down through generations of villagers, a reminder of the beauty and wonder of the universe and the magic that lay just beyond the edge of our everyday world.
|
| 48 |
+
|
| 49 |
+
Number of generated tokens: 476
|
| 50 |
+
TTFT: 0.13s
|
| 51 |
+
TPS: avg=18.45, quantiles=['18.80', '18.50', '18.30', '18.09']
|
| 52 |
+
>>> WARN:starting syslog with prefix MLA-RT
|
| 53 |
+
~MLALogger: logger is closed
|
devkit/precision.json
CHANGED
|
@@ -2,357 +2,357 @@
|
|
| 2 |
{
|
| 3 |
"part": "group_pre",
|
| 4 |
"idx": 0,
|
| 5 |
-
"precision": "
|
| 6 |
},
|
| 7 |
{
|
| 8 |
"part": "group_pre",
|
| 9 |
"idx": 1,
|
| 10 |
-
"precision": "
|
| 11 |
},
|
| 12 |
{
|
| 13 |
"part": "group_pre",
|
| 14 |
"idx": 2,
|
| 15 |
-
"precision": "
|
| 16 |
},
|
| 17 |
{
|
| 18 |
"part": "group_pre",
|
| 19 |
"idx": 3,
|
| 20 |
-
"precision": "
|
| 21 |
},
|
| 22 |
{
|
| 23 |
"part": "group_pre",
|
| 24 |
"idx": 4,
|
| 25 |
-
"precision": "
|
| 26 |
},
|
| 27 |
{
|
| 28 |
"part": "group_pre",
|
| 29 |
"idx": 5,
|
| 30 |
-
"precision": "
|
| 31 |
},
|
| 32 |
{
|
| 33 |
"part": "group_pre",
|
| 34 |
"idx": 6,
|
| 35 |
-
"precision": "
|
| 36 |
},
|
| 37 |
{
|
| 38 |
"part": "group_pre",
|
| 39 |
"idx": 7,
|
| 40 |
-
"precision": "
|
| 41 |
},
|
| 42 |
{
|
| 43 |
"part": "group_pre",
|
| 44 |
"idx": 8,
|
| 45 |
-
"precision": "
|
| 46 |
},
|
| 47 |
{
|
| 48 |
"part": "group_pre",
|
| 49 |
"idx": 9,
|
| 50 |
-
"precision": "
|
| 51 |
},
|
| 52 |
{
|
| 53 |
"part": "group_pre",
|
| 54 |
"idx": 10,
|
| 55 |
-
"precision": "
|
| 56 |
},
|
| 57 |
{
|
| 58 |
"part": "group_pre",
|
| 59 |
"idx": 11,
|
| 60 |
-
"precision": "
|
| 61 |
},
|
| 62 |
{
|
| 63 |
"part": "group_pre",
|
| 64 |
"idx": 12,
|
| 65 |
-
"precision": "
|
| 66 |
},
|
| 67 |
{
|
| 68 |
"part": "group_pre",
|
| 69 |
"idx": 13,
|
| 70 |
-
"precision": "
|
| 71 |
},
|
| 72 |
{
|
| 73 |
"part": "group_pre",
|
| 74 |
"idx": 14,
|
| 75 |
-
"precision": "
|
| 76 |
},
|
| 77 |
{
|
| 78 |
"part": "group_pre",
|
| 79 |
"idx": 15,
|
| 80 |
-
"precision": "
|
| 81 |
},
|
| 82 |
{
|
| 83 |
"part": "group_pre",
|
| 84 |
"idx": 16,
|
| 85 |
-
"precision": "
|
| 86 |
},
|
| 87 |
{
|
| 88 |
"part": "group_pre",
|
| 89 |
"idx": 17,
|
| 90 |
-
"precision": "
|
| 91 |
},
|
| 92 |
{
|
| 93 |
"part": "group_pre",
|
| 94 |
"idx": 18,
|
| 95 |
-
"precision": "
|
| 96 |
},
|
| 97 |
{
|
| 98 |
"part": "group_pre",
|
| 99 |
"idx": 19,
|
| 100 |
-
"precision": "
|
| 101 |
},
|
| 102 |
{
|
| 103 |
"part": "group_pre",
|
| 104 |
"idx": 20,
|
| 105 |
-
"precision": "
|
| 106 |
},
|
| 107 |
{
|
| 108 |
"part": "group_pre",
|
| 109 |
"idx": 21,
|
| 110 |
-
"precision": "
|
| 111 |
},
|
| 112 |
{
|
| 113 |
"part": "group_pre",
|
| 114 |
"idx": 22,
|
| 115 |
-
"precision": "
|
| 116 |
},
|
| 117 |
{
|
| 118 |
"part": "group_pre",
|
| 119 |
"idx": 23,
|
| 120 |
-
"precision": "
|
| 121 |
},
|
| 122 |
{
|
| 123 |
"part": "group_pre",
|
| 124 |
"idx": 24,
|
| 125 |
-
"precision": "
|
| 126 |
},
|
| 127 |
{
|
| 128 |
"part": "group_pre",
|
| 129 |
"idx": 25,
|
| 130 |
-
"precision": "
|
| 131 |
},
|
| 132 |
{
|
| 133 |
"part": "group_pre",
|
| 134 |
"idx": 26,
|
| 135 |
-
"precision": "
|
| 136 |
},
|
| 137 |
{
|
| 138 |
"part": "group_pre",
|
| 139 |
"idx": 27,
|
| 140 |
-
"precision": "
|
| 141 |
},
|
| 142 |
{
|
| 143 |
"part": "group_post",
|
| 144 |
"idx": 0,
|
| 145 |
-
"precision": "
|
| 146 |
},
|
| 147 |
{
|
| 148 |
"part": "group_post",
|
| 149 |
"idx": 1,
|
| 150 |
-
"precision": "
|
| 151 |
},
|
| 152 |
{
|
| 153 |
"part": "group_post",
|
| 154 |
"idx": 2,
|
| 155 |
-
"precision": "
|
| 156 |
},
|
| 157 |
{
|
| 158 |
"part": "group_post",
|
| 159 |
"idx": 3,
|
| 160 |
-
"precision": "
|
| 161 |
},
|
| 162 |
{
|
| 163 |
"part": "group_post",
|
| 164 |
"idx": 4,
|
| 165 |
-
"precision": "
|
| 166 |
},
|
| 167 |
{
|
| 168 |
"part": "group_post",
|
| 169 |
"idx": 5,
|
| 170 |
-
"precision": "
|
| 171 |
},
|
| 172 |
{
|
| 173 |
"part": "group_post",
|
| 174 |
"idx": 6,
|
| 175 |
-
"precision": "
|
| 176 |
},
|
| 177 |
{
|
| 178 |
"part": "group_post",
|
| 179 |
"idx": 7,
|
| 180 |
-
"precision": "
|
| 181 |
},
|
| 182 |
{
|
| 183 |
"part": "group_post",
|
| 184 |
"idx": 8,
|
| 185 |
-
"precision": "
|
| 186 |
},
|
| 187 |
{
|
| 188 |
"part": "group_post",
|
| 189 |
"idx": 9,
|
| 190 |
-
"precision": "
|
| 191 |
},
|
| 192 |
{
|
| 193 |
"part": "group_post",
|
| 194 |
"idx": 10,
|
| 195 |
-
"precision": "
|
| 196 |
},
|
| 197 |
{
|
| 198 |
"part": "group_post",
|
| 199 |
"idx": 11,
|
| 200 |
-
"precision": "
|
| 201 |
},
|
| 202 |
{
|
| 203 |
"part": "group_post",
|
| 204 |
"idx": 12,
|
| 205 |
-
"precision": "
|
| 206 |
},
|
| 207 |
{
|
| 208 |
"part": "group_post",
|
| 209 |
"idx": 13,
|
| 210 |
-
"precision": "
|
| 211 |
},
|
| 212 |
{
|
| 213 |
"part": "group_post",
|
| 214 |
"idx": 14,
|
| 215 |
-
"precision": "
|
| 216 |
},
|
| 217 |
{
|
| 218 |
"part": "group_post",
|
| 219 |
"idx": 15,
|
| 220 |
-
"precision": "
|
| 221 |
},
|
| 222 |
{
|
| 223 |
"part": "group_post",
|
| 224 |
"idx": 16,
|
| 225 |
-
"precision": "
|
| 226 |
},
|
| 227 |
{
|
| 228 |
"part": "group_post",
|
| 229 |
"idx": 17,
|
| 230 |
-
"precision": "
|
| 231 |
},
|
| 232 |
{
|
| 233 |
"part": "group_post",
|
| 234 |
"idx": 18,
|
| 235 |
-
"precision": "
|
| 236 |
},
|
| 237 |
{
|
| 238 |
"part": "group_post",
|
| 239 |
"idx": 19,
|
| 240 |
-
"precision": "
|
| 241 |
},
|
| 242 |
{
|
| 243 |
"part": "group_post",
|
| 244 |
"idx": 20,
|
| 245 |
-
"precision": "
|
| 246 |
},
|
| 247 |
{
|
| 248 |
"part": "group_post",
|
| 249 |
"idx": 21,
|
| 250 |
-
"precision": "
|
| 251 |
},
|
| 252 |
{
|
| 253 |
"part": "group_post",
|
| 254 |
"idx": 22,
|
| 255 |
-
"precision": "
|
| 256 |
},
|
| 257 |
{
|
| 258 |
"part": "group_post",
|
| 259 |
"idx": 23,
|
| 260 |
-
"precision": "
|
| 261 |
},
|
| 262 |
{
|
| 263 |
"part": "group_post",
|
| 264 |
"idx": 24,
|
| 265 |
-
"precision": "
|
| 266 |
},
|
| 267 |
{
|
| 268 |
"part": "group_post",
|
| 269 |
"idx": 25,
|
| 270 |
-
"precision": "
|
| 271 |
},
|
| 272 |
{
|
| 273 |
"part": "group_post",
|
| 274 |
"idx": 26,
|
| 275 |
-
"precision": "
|
| 276 |
},
|
| 277 |
{
|
| 278 |
"part": "group_cache",
|
| 279 |
"idx": 0,
|
| 280 |
-
"precision": "
|
| 281 |
},
|
| 282 |
{
|
| 283 |
"part": "group_cache",
|
| 284 |
"idx": 128,
|
| 285 |
-
"precision": "
|
| 286 |
},
|
| 287 |
{
|
| 288 |
"part": "group_cache",
|
| 289 |
"idx": 256,
|
| 290 |
-
"precision": "
|
| 291 |
},
|
| 292 |
{
|
| 293 |
"part": "group_cache",
|
| 294 |
"idx": 384,
|
| 295 |
-
"precision": "
|
| 296 |
},
|
| 297 |
{
|
| 298 |
"part": "group_cache",
|
| 299 |
"idx": 512,
|
| 300 |
-
"precision": "
|
| 301 |
},
|
| 302 |
{
|
| 303 |
"part": "group_cache",
|
| 304 |
"idx": 640,
|
| 305 |
-
"precision": "
|
| 306 |
},
|
| 307 |
{
|
| 308 |
"part": "group_cache",
|
| 309 |
"idx": 768,
|
| 310 |
-
"precision": "
|
| 311 |
},
|
| 312 |
{
|
| 313 |
"part": "group_cache",
|
| 314 |
"idx": 896,
|
| 315 |
-
"precision": "
|
| 316 |
},
|
| 317 |
{
|
| 318 |
"part": "group_cache",
|
| 319 |
"idx": 1024,
|
| 320 |
-
"precision": "
|
| 321 |
},
|
| 322 |
{
|
| 323 |
"part": "group_cache",
|
| 324 |
"idx": 1152,
|
| 325 |
-
"precision": "
|
| 326 |
},
|
| 327 |
{
|
| 328 |
"part": "group_cache",
|
| 329 |
"idx": 1280,
|
| 330 |
-
"precision": "
|
| 331 |
},
|
| 332 |
{
|
| 333 |
"part": "group_cache",
|
| 334 |
"idx": 1408,
|
| 335 |
-
"precision": "
|
| 336 |
},
|
| 337 |
{
|
| 338 |
"part": "group_cache",
|
| 339 |
"idx": 1536,
|
| 340 |
-
"precision": "
|
| 341 |
},
|
| 342 |
{
|
| 343 |
"part": "group_cache",
|
| 344 |
"idx": 1664,
|
| 345 |
-
"precision": "
|
| 346 |
},
|
| 347 |
{
|
| 348 |
"part": "group_cache",
|
| 349 |
"idx": 1792,
|
| 350 |
-
"precision": "
|
| 351 |
},
|
| 352 |
{
|
| 353 |
"part": "group_cache",
|
| 354 |
"idx": 1920,
|
| 355 |
-
"precision": "
|
| 356 |
},
|
| 357 |
{
|
| 358 |
"part": "single_pre",
|
|
|
|
| 2 |
{
|
| 3 |
"part": "group_pre",
|
| 4 |
"idx": 0,
|
| 5 |
+
"precision": "A_BF16_W_INT8"
|
| 6 |
},
|
| 7 |
{
|
| 8 |
"part": "group_pre",
|
| 9 |
"idx": 1,
|
| 10 |
+
"precision": "A_BF16_W_INT8"
|
| 11 |
},
|
| 12 |
{
|
| 13 |
"part": "group_pre",
|
| 14 |
"idx": 2,
|
| 15 |
+
"precision": "A_BF16_W_INT8"
|
| 16 |
},
|
| 17 |
{
|
| 18 |
"part": "group_pre",
|
| 19 |
"idx": 3,
|
| 20 |
+
"precision": "A_BF16_W_INT8"
|
| 21 |
},
|
| 22 |
{
|
| 23 |
"part": "group_pre",
|
| 24 |
"idx": 4,
|
| 25 |
+
"precision": "A_BF16_W_INT8"
|
| 26 |
},
|
| 27 |
{
|
| 28 |
"part": "group_pre",
|
| 29 |
"idx": 5,
|
| 30 |
+
"precision": "A_BF16_W_INT8"
|
| 31 |
},
|
| 32 |
{
|
| 33 |
"part": "group_pre",
|
| 34 |
"idx": 6,
|
| 35 |
+
"precision": "A_BF16_W_INT8"
|
| 36 |
},
|
| 37 |
{
|
| 38 |
"part": "group_pre",
|
| 39 |
"idx": 7,
|
| 40 |
+
"precision": "A_BF16_W_INT8"
|
| 41 |
},
|
| 42 |
{
|
| 43 |
"part": "group_pre",
|
| 44 |
"idx": 8,
|
| 45 |
+
"precision": "A_BF16_W_INT8"
|
| 46 |
},
|
| 47 |
{
|
| 48 |
"part": "group_pre",
|
| 49 |
"idx": 9,
|
| 50 |
+
"precision": "A_BF16_W_INT8"
|
| 51 |
},
|
| 52 |
{
|
| 53 |
"part": "group_pre",
|
| 54 |
"idx": 10,
|
| 55 |
+
"precision": "A_BF16_W_INT8"
|
| 56 |
},
|
| 57 |
{
|
| 58 |
"part": "group_pre",
|
| 59 |
"idx": 11,
|
| 60 |
+
"precision": "A_BF16_W_INT8"
|
| 61 |
},
|
| 62 |
{
|
| 63 |
"part": "group_pre",
|
| 64 |
"idx": 12,
|
| 65 |
+
"precision": "A_BF16_W_INT8"
|
| 66 |
},
|
| 67 |
{
|
| 68 |
"part": "group_pre",
|
| 69 |
"idx": 13,
|
| 70 |
+
"precision": "A_BF16_W_INT8"
|
| 71 |
},
|
| 72 |
{
|
| 73 |
"part": "group_pre",
|
| 74 |
"idx": 14,
|
| 75 |
+
"precision": "A_BF16_W_INT8"
|
| 76 |
},
|
| 77 |
{
|
| 78 |
"part": "group_pre",
|
| 79 |
"idx": 15,
|
| 80 |
+
"precision": "A_BF16_W_INT8"
|
| 81 |
},
|
| 82 |
{
|
| 83 |
"part": "group_pre",
|
| 84 |
"idx": 16,
|
| 85 |
+
"precision": "A_BF16_W_INT8"
|
| 86 |
},
|
| 87 |
{
|
| 88 |
"part": "group_pre",
|
| 89 |
"idx": 17,
|
| 90 |
+
"precision": "A_BF16_W_INT8"
|
| 91 |
},
|
| 92 |
{
|
| 93 |
"part": "group_pre",
|
| 94 |
"idx": 18,
|
| 95 |
+
"precision": "A_BF16_W_INT8"
|
| 96 |
},
|
| 97 |
{
|
| 98 |
"part": "group_pre",
|
| 99 |
"idx": 19,
|
| 100 |
+
"precision": "A_BF16_W_INT8"
|
| 101 |
},
|
| 102 |
{
|
| 103 |
"part": "group_pre",
|
| 104 |
"idx": 20,
|
| 105 |
+
"precision": "A_BF16_W_INT8"
|
| 106 |
},
|
| 107 |
{
|
| 108 |
"part": "group_pre",
|
| 109 |
"idx": 21,
|
| 110 |
+
"precision": "A_BF16_W_INT8"
|
| 111 |
},
|
| 112 |
{
|
| 113 |
"part": "group_pre",
|
| 114 |
"idx": 22,
|
| 115 |
+
"precision": "A_BF16_W_INT8"
|
| 116 |
},
|
| 117 |
{
|
| 118 |
"part": "group_pre",
|
| 119 |
"idx": 23,
|
| 120 |
+
"precision": "A_BF16_W_INT8"
|
| 121 |
},
|
| 122 |
{
|
| 123 |
"part": "group_pre",
|
| 124 |
"idx": 24,
|
| 125 |
+
"precision": "A_BF16_W_INT8"
|
| 126 |
},
|
| 127 |
{
|
| 128 |
"part": "group_pre",
|
| 129 |
"idx": 25,
|
| 130 |
+
"precision": "A_BF16_W_INT8"
|
| 131 |
},
|
| 132 |
{
|
| 133 |
"part": "group_pre",
|
| 134 |
"idx": 26,
|
| 135 |
+
"precision": "A_BF16_W_INT8"
|
| 136 |
},
|
| 137 |
{
|
| 138 |
"part": "group_pre",
|
| 139 |
"idx": 27,
|
| 140 |
+
"precision": "A_BF16_W_INT8"
|
| 141 |
},
|
| 142 |
{
|
| 143 |
"part": "group_post",
|
| 144 |
"idx": 0,
|
| 145 |
+
"precision": "A_BF16_W_INT8"
|
| 146 |
},
|
| 147 |
{
|
| 148 |
"part": "group_post",
|
| 149 |
"idx": 1,
|
| 150 |
+
"precision": "A_BF16_W_INT8"
|
| 151 |
},
|
| 152 |
{
|
| 153 |
"part": "group_post",
|
| 154 |
"idx": 2,
|
| 155 |
+
"precision": "A_BF16_W_INT8"
|
| 156 |
},
|
| 157 |
{
|
| 158 |
"part": "group_post",
|
| 159 |
"idx": 3,
|
| 160 |
+
"precision": "A_BF16_W_INT8"
|
| 161 |
},
|
| 162 |
{
|
| 163 |
"part": "group_post",
|
| 164 |
"idx": 4,
|
| 165 |
+
"precision": "A_BF16_W_INT8"
|
| 166 |
},
|
| 167 |
{
|
| 168 |
"part": "group_post",
|
| 169 |
"idx": 5,
|
| 170 |
+
"precision": "A_BF16_W_INT8"
|
| 171 |
},
|
| 172 |
{
|
| 173 |
"part": "group_post",
|
| 174 |
"idx": 6,
|
| 175 |
+
"precision": "A_BF16_W_INT8"
|
| 176 |
},
|
| 177 |
{
|
| 178 |
"part": "group_post",
|
| 179 |
"idx": 7,
|
| 180 |
+
"precision": "A_BF16_W_INT8"
|
| 181 |
},
|
| 182 |
{
|
| 183 |
"part": "group_post",
|
| 184 |
"idx": 8,
|
| 185 |
+
"precision": "A_BF16_W_INT8"
|
| 186 |
},
|
| 187 |
{
|
| 188 |
"part": "group_post",
|
| 189 |
"idx": 9,
|
| 190 |
+
"precision": "A_BF16_W_INT8"
|
| 191 |
},
|
| 192 |
{
|
| 193 |
"part": "group_post",
|
| 194 |
"idx": 10,
|
| 195 |
+
"precision": "A_BF16_W_INT8"
|
| 196 |
},
|
| 197 |
{
|
| 198 |
"part": "group_post",
|
| 199 |
"idx": 11,
|
| 200 |
+
"precision": "A_BF16_W_INT8"
|
| 201 |
},
|
| 202 |
{
|
| 203 |
"part": "group_post",
|
| 204 |
"idx": 12,
|
| 205 |
+
"precision": "A_BF16_W_INT8"
|
| 206 |
},
|
| 207 |
{
|
| 208 |
"part": "group_post",
|
| 209 |
"idx": 13,
|
| 210 |
+
"precision": "A_BF16_W_INT8"
|
| 211 |
},
|
| 212 |
{
|
| 213 |
"part": "group_post",
|
| 214 |
"idx": 14,
|
| 215 |
+
"precision": "A_BF16_W_INT8"
|
| 216 |
},
|
| 217 |
{
|
| 218 |
"part": "group_post",
|
| 219 |
"idx": 15,
|
| 220 |
+
"precision": "A_BF16_W_INT8"
|
| 221 |
},
|
| 222 |
{
|
| 223 |
"part": "group_post",
|
| 224 |
"idx": 16,
|
| 225 |
+
"precision": "A_BF16_W_INT8"
|
| 226 |
},
|
| 227 |
{
|
| 228 |
"part": "group_post",
|
| 229 |
"idx": 17,
|
| 230 |
+
"precision": "A_BF16_W_INT8"
|
| 231 |
},
|
| 232 |
{
|
| 233 |
"part": "group_post",
|
| 234 |
"idx": 18,
|
| 235 |
+
"precision": "A_BF16_W_INT8"
|
| 236 |
},
|
| 237 |
{
|
| 238 |
"part": "group_post",
|
| 239 |
"idx": 19,
|
| 240 |
+
"precision": "A_BF16_W_INT8"
|
| 241 |
},
|
| 242 |
{
|
| 243 |
"part": "group_post",
|
| 244 |
"idx": 20,
|
| 245 |
+
"precision": "A_BF16_W_INT8"
|
| 246 |
},
|
| 247 |
{
|
| 248 |
"part": "group_post",
|
| 249 |
"idx": 21,
|
| 250 |
+
"precision": "A_BF16_W_INT8"
|
| 251 |
},
|
| 252 |
{
|
| 253 |
"part": "group_post",
|
| 254 |
"idx": 22,
|
| 255 |
+
"precision": "A_BF16_W_INT8"
|
| 256 |
},
|
| 257 |
{
|
| 258 |
"part": "group_post",
|
| 259 |
"idx": 23,
|
| 260 |
+
"precision": "A_BF16_W_INT8"
|
| 261 |
},
|
| 262 |
{
|
| 263 |
"part": "group_post",
|
| 264 |
"idx": 24,
|
| 265 |
+
"precision": "A_BF16_W_INT8"
|
| 266 |
},
|
| 267 |
{
|
| 268 |
"part": "group_post",
|
| 269 |
"idx": 25,
|
| 270 |
+
"precision": "A_BF16_W_INT8"
|
| 271 |
},
|
| 272 |
{
|
| 273 |
"part": "group_post",
|
| 274 |
"idx": 26,
|
| 275 |
+
"precision": "A_BF16_W_INT8"
|
| 276 |
},
|
| 277 |
{
|
| 278 |
"part": "group_cache",
|
| 279 |
"idx": 0,
|
| 280 |
+
"precision": "A_BF16_W_INT8"
|
| 281 |
},
|
| 282 |
{
|
| 283 |
"part": "group_cache",
|
| 284 |
"idx": 128,
|
| 285 |
+
"precision": "A_BF16_W_INT8"
|
| 286 |
},
|
| 287 |
{
|
| 288 |
"part": "group_cache",
|
| 289 |
"idx": 256,
|
| 290 |
+
"precision": "A_BF16_W_INT8"
|
| 291 |
},
|
| 292 |
{
|
| 293 |
"part": "group_cache",
|
| 294 |
"idx": 384,
|
| 295 |
+
"precision": "A_BF16_W_INT8"
|
| 296 |
},
|
| 297 |
{
|
| 298 |
"part": "group_cache",
|
| 299 |
"idx": 512,
|
| 300 |
+
"precision": "A_BF16_W_INT8"
|
| 301 |
},
|
| 302 |
{
|
| 303 |
"part": "group_cache",
|
| 304 |
"idx": 640,
|
| 305 |
+
"precision": "A_BF16_W_INT8"
|
| 306 |
},
|
| 307 |
{
|
| 308 |
"part": "group_cache",
|
| 309 |
"idx": 768,
|
| 310 |
+
"precision": "A_BF16_W_INT8"
|
| 311 |
},
|
| 312 |
{
|
| 313 |
"part": "group_cache",
|
| 314 |
"idx": 896,
|
| 315 |
+
"precision": "A_BF16_W_INT8"
|
| 316 |
},
|
| 317 |
{
|
| 318 |
"part": "group_cache",
|
| 319 |
"idx": 1024,
|
| 320 |
+
"precision": "A_BF16_W_INT8"
|
| 321 |
},
|
| 322 |
{
|
| 323 |
"part": "group_cache",
|
| 324 |
"idx": 1152,
|
| 325 |
+
"precision": "A_BF16_W_INT8"
|
| 326 |
},
|
| 327 |
{
|
| 328 |
"part": "group_cache",
|
| 329 |
"idx": 1280,
|
| 330 |
+
"precision": "A_BF16_W_INT8"
|
| 331 |
},
|
| 332 |
{
|
| 333 |
"part": "group_cache",
|
| 334 |
"idx": 1408,
|
| 335 |
+
"precision": "A_BF16_W_INT8"
|
| 336 |
},
|
| 337 |
{
|
| 338 |
"part": "group_cache",
|
| 339 |
"idx": 1536,
|
| 340 |
+
"precision": "A_BF16_W_INT8"
|
| 341 |
},
|
| 342 |
{
|
| 343 |
"part": "group_cache",
|
| 344 |
"idx": 1664,
|
| 345 |
+
"precision": "A_BF16_W_INT8"
|
| 346 |
},
|
| 347 |
{
|
| 348 |
"part": "group_cache",
|
| 349 |
"idx": 1792,
|
| 350 |
+
"precision": "A_BF16_W_INT8"
|
| 351 |
},
|
| 352 |
{
|
| 353 |
"part": "group_cache",
|
| 354 |
"idx": 1920,
|
| 355 |
+
"precision": "A_BF16_W_INT8"
|
| 356 |
},
|
| 357 |
{
|
| 358 |
"part": "single_pre",
|
devkit/vlm_config.json
CHANGED
|
@@ -58,6 +58,7 @@
|
|
| 58 |
},
|
| 59 |
"pipeline_cfg": {
|
| 60 |
"system_prompt": null,
|
|
|
|
| 61 |
"max_num_tokens": 2048,
|
| 62 |
"input_token_group_size": 128,
|
| 63 |
"input_token_group_offsets": [
|
|
|
|
| 58 |
},
|
| 59 |
"pipeline_cfg": {
|
| 60 |
"system_prompt": null,
|
| 61 |
+
"chat_template": null,
|
| 62 |
"max_num_tokens": 2048,
|
| 63 |
"input_token_group_size": 128,
|
| 64 |
"input_token_group_offsets": [
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token0_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca700b22e336c83e71d880148fc48790736e2aa79d25b1a25c9b91ace5b46297
|
| 3 |
+
size 3401432
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token1024_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5a46169a6ef8fccd0d039a5b0f9bdfb93f26a71d187492796be4b1ab90aaeab9
|
| 3 |
+
size 10845272
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token1152_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a5ef188745c39367a33ab9063e2b09fca4e11dea0c381b8818cddf868d35b119
|
| 3 |
+
size 13135256
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token1280_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6f7de46dcae36af5daeaec2d934c045ee2136188870bfc0156b1cb367a275031
|
| 3 |
+
size 12327728
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token128_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:70ebb28ee3f4c51f24ecdceca2c3a863f0f62ca4a1565c420d55525614c6b2c5
|
| 3 |
+
size 4233104
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token1408_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:896cb3c3aae95b8e7ab7c1f74b902b7c9eb62eaf21a8a3fa48a958b575a3b9cc
|
| 3 |
+
size 15098336
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token1536_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:405fa5b6f5ce843d3f6419891b1140c44be8d533043a09536cb144aeb9ecae5a
|
| 3 |
+
size 12033840
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token1664_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2de1cab87bdc81a223154d3ecbb303690087edaa41fb27049df94cb9265b4a1c
|
| 3 |
+
size 12084936
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token1792_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0e1848620773150da324539516d61a425c74f08fe2ebdae20f0176d9f93c609c
|
| 3 |
+
size 13031456
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token1920_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:29f68808d78245db93cb412cf22ceabdf9df91707dac3280af7e237b6eee85ab
|
| 3 |
+
size 13259552
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token256_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ba56b4e2ef804240fa93cc37da5d0193bd451c22f2b89cf3031a47a3ea99e9c
|
| 3 |
+
size 4396720
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token384_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:20bc01829749925f9eb22110a3fbf35236524a171132b7841303690d4de224e0
|
| 3 |
+
size 4621064
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token512_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ac8590821dbdb8ce3a9faff797fa4180bb57cb64e16545ce657437298411111f
|
| 3 |
+
size 5901152
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token640_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5d3b95e893a63f13b38645496a47df5a14e1b78d909634ee121dabd08f889ff5
|
| 3 |
+
size 5997512
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token768_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f97a8933bafba66a4fe026ff39ac46427212672d1f9090c01918852d7bdd32e9
|
| 3 |
+
size 6072704
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_cache_token896_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dc8d79b37a359a6d6df883eb6f22e4eaf7566a9dbb73f9692a89db15accab2fb
|
| 3 |
+
size 7383576
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer0_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:89bb0d4f3b764e057e61c189a21c2d011d07160c66ef4513cb99ed391d882538
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer10_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4fe12defe5da30929f5b14abf21ada4dfe4801c6393a306274f657b4ca5ef9d0
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer11_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c877069bef2789388b91bf6f93115493e3c0c8a34903e98572f5f9d9ff7cc689
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer12_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d98da92ff4256586df904d73d066564d85e24d45ba5659a3f4bb1e693a09139d
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer13_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a855e8efaa8f1d7336306a604f1a68217b16409d5e652b18c83e1357e3ef4568
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer14_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dbfacc6c8746d483c117a5283cbb5d5ce64ebadaf75bc17f36663302e207ee56
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer15_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:89e5a35fe6b214ee4e323b77142467f890cafcd7f19e4e9fe629bf439a2772db
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer16_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:90b6727a850ec028597ad824043122d0071471dc9ec18cb653b53a47f61a5195
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer17_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2b46df5861eea55437dae07b00452cc9a0c3c96dcceefbfa33e85b47946d0b3e
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer18_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:06372bb3504f5ef095645b2f5c2c477f4b4c79d4447e22303541b7cae8253b3b
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer19_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:75a855b5426a45f291592f11a3af059f54cc5417b8b8ee9b7a209dc8cb3f3893
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer1_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8f17bb9d7dc55a8acdd9ad0a577bbd5091b1f97cd80d61c404148b8edb40a3d3
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer20_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:986b0496a5ac6e0f7137d1b92b3cd88b817167f2891b771a26b0cf69cd2e0f9e
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer21_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:503cbf9435c4c674855ecba6a158fe70dbb82f93bf908abb80e25274aa77c867
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer22_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f54c127c779643907294d47887a26ada15aa14eece2ad7008155e94c87bc1c49
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer23_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:db38a4c71ceede23f9ef22c02ef34f1afefe09398f03a8b0c1a1f2bcd53367c0
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer24_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:94ce53f2e040c14c0e87aa92d227057e5a9825478ea5ed99bdb597aea5a9c944
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer25_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5e5d0aafb478ae9a08979c1305eb0a7e0929a84714f710b59f3b0e809e77a19a
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer26_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a4687c78ab9fd4a075712d097ed63d4bfbf9a7504f3a43e4d2eb4fde1eac2e5b
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer2_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2cda2ae33cfb044af3071daf7dba0daeb0b626482e2dd8eb761d294317764ba6
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer3_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8e14ddbe272e944c4a9983752cb998e5659b71d0e032875feca4b77afe595579
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer4_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8b9d966a14b28ee545f25b52a16f3c74a472ebe6bded9f313a4e2186ee482564
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer5_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:242a872951efdcb3c4ded087d180a4ab78a1dbb05a852ff0bc3660cbc681923a
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer6_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f485ccfd524293afdfc88d8f71c8dcd299aba0733a6ea474d48d26199ff763a0
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer7_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9dd6b6a9054e367b7860a17fb23cccf8bd7b6bbe23b88b86bad97b8218622841
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer8_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:117c81f47e8281d330636d2136930e016a37da02e33a4084a40c2b8a57e4bf05
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_post_layer9_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:59a0eabd082e0cc3459ace47288f654850ea093194e970d034ac42849395200a
|
| 3 |
+
size 97409136
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_pre_layer0_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:15ef21defe8ecd945fdfff0a60b70c319d2d975a1083f6ce12848a025b96fb80
|
| 3 |
+
size 21807424
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_pre_layer10_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a96ab9b78c2d0bbbb5eeeb3083469fd2aff5ee50477a1d47288aaf6467d241ec
|
| 3 |
+
size 21807424
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_pre_layer11_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3978d4768b3d95f57f48c8a717f2565a627036ad8ca4e1da309fb6fe26233e76
|
| 3 |
+
size 21807424
|
elf_files/models--meta-llama--Llama-3.2-3B-Instruct_language_n128_pre_layer12_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:88336f6ed59be62f94df6612a0dc2758c11a23c7f8358358346506a947a492f3
|
| 3 |
+
size 21807424
|