2.0.0
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- console.log +36 -0
- devkit/.vlm_config.json.swp +0 -0
- devkit/precision.json +79 -79
- devkit/vlm_config.json +1 -0
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token0_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token1024_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token1152_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token1280_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token128_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token1408_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token1536_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token1664_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token1792_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token1920_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token256_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token384_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token512_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token640_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token768_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token896_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer0_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer10_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer11_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer12_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer13_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer14_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer15_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer16_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer17_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer18_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer19_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer1_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer20_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer21_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer22_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer23_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer24_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer25_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer26_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer27_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer28_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer29_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer2_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer30_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer3_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer4_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer5_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer6_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer7_stage1_mla.elf +2 -2
- elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer8_stage1_mla.elf +2 -2
console.log
ADDED
|
@@ -0,0 +1,36 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
None of PyTorch, TensorFlow >= 2.0, or Flax have been found. Models won't be available and only tokenizers, configuration and file/data utilities can be used.
|
| 2 |
+
None of PyTorch, TensorFlow >= 2.0, or Flax have been found. Models won't be available and only tokenizers, configuration and file/data utilities can be used.
|
| 3 |
+
VLM initialization starting ...
|
| 4 |
+
VLM initialization completed.
|
| 5 |
+
>>> Query: Why is the sky blue?
|
| 6 |
+
Assistant: The sky appears blue because of a process called Rayleigh scattering. As sunlight reaches Earth, it's made up of different wavelengths or colors. Shorter wavelengths (like blue and violet) are scattered in all directions more than longer wavelengths (like red, orange, and yellow). The Earth's atmosphere scatters short-wavelength light more, and since we're more likely to see the scattered blue and violet light, the sky appears blue to us. However, the human eye is more sensitive to blue light and less sensitive to violet light, so we perceive the sky as blue, not violet. Additionally, sunlight reaches us more from the blue part of the spectrum, as the sun is higher in the sky during the day, and the blue light is scattered more by the atmosphere. At sunset, when the sun is lower in the sky, the longer wavelengths (red, orange, and yellow) are scattered more, and we see the sky change colors.
|
| 7 |
+
|
| 8 |
+
Number of generated tokens: 211
|
| 9 |
+
TTFT: 0.49s
|
| 10 |
+
TPS: avg=10.99, quantiles=['11.09', '11.07', '10.90', '10.88']
|
| 11 |
+
>>> Query: Summarize
|
| 12 |
+
Assistant: The sky appears blue because of a process called Rayleigh scattering, where shorter wavelengths (like blue and violet) are scattered in all directions more than longer wavelengths (like red, orange, and yellow) by the Earth's atmosphere. The human eye is more sensitive to blue light and less sensitive to violet light, so we perceive the sky as blue, not violet. Additionally, sunlight reaches us more from the blue part of the spectrum, as the sun is higher in the sky during the day, and the blue light is scattered more by the atmosphere. At sunset, when the sun is lower in the sky, the longer wavelengths (red, orange, and yellow) are scattered more, and we see the sky change colors.
|
| 13 |
+
|
| 14 |
+
Number of generated tokens: 159
|
| 15 |
+
TTFT: 0.35s
|
| 16 |
+
TPS: avg=10.81, quantiles=['10.83', '10.81', '10.80', '10.79']
|
| 17 |
+
>>> Query: Tell me a story based on this
|
| 18 |
+
Assistant: Once upon a time, in a small village nestled between the mountains, lived a young girl named Aria. Every day, Aria would spend hours gazing at the sky, marveling at its ever-changing hues.
|
| 19 |
+
|
| 20 |
+
One day, as Aria sat by the river, she noticed something unusual. The sky was not its usual blue, but a deep, rich purple. Intrigued, she decided to find out why.
|
| 21 |
+
|
| 22 |
+
She spent the next few days researching and studying the behavior of light. She learned about the process of Rayleigh scattering, where shorter wavelengths (like blue and violet) are scattered in all directions more than longer wavelengths (like red, orange, and yellow) by the Earth's atmosphere.
|
| 23 |
+
|
| 24 |
+
Armed with this new knowledge, Aria set out to share her findings with the village. The villagers were amazed by her discovery and thanked her for her hard work.
|
| 25 |
+
|
| 26 |
+
From that day on, Aria became known as the "Sky Whisperer" and continued to share her love for the sky with everyone in the village. Every night, the villagers would gather around Aria as she pointed out constellations, planets, and other celestial wonders.
|
| 27 |
+
|
| 28 |
+
Years passed, and Aria grew old, but her love for the sky never faded. She continued to share her knowledge with the younger generations, inspiring them to look up and marvel at the beauty of the universe.
|
| 29 |
+
|
| 30 |
+
And so, the story of Aria, the Sky Whisperer, became a legend in the small village, and her love for the sky lived on in the hearts of all who knew her.
|
| 31 |
+
|
| 32 |
+
Number of generated tokens: 354
|
| 33 |
+
TTFT: 0.36s
|
| 34 |
+
TPS: avg=10.52, quantiles=['10.62', '10.56', '10.54', '10.40']
|
| 35 |
+
>>> WARN:starting syslog with prefix MLA-RT
|
| 36 |
+
~MLALogger: logger is closed
|
devkit/.vlm_config.json.swp
ADDED
|
Binary file (12.3 kB). View file
|
|
|
devkit/precision.json
CHANGED
|
@@ -2,397 +2,397 @@
|
|
| 2 |
{
|
| 3 |
"part": "group_pre",
|
| 4 |
"idx": 0,
|
| 5 |
-
"precision": "
|
| 6 |
},
|
| 7 |
{
|
| 8 |
"part": "group_pre",
|
| 9 |
"idx": 1,
|
| 10 |
-
"precision": "
|
| 11 |
},
|
| 12 |
{
|
| 13 |
"part": "group_pre",
|
| 14 |
"idx": 2,
|
| 15 |
-
"precision": "
|
| 16 |
},
|
| 17 |
{
|
| 18 |
"part": "group_pre",
|
| 19 |
"idx": 3,
|
| 20 |
-
"precision": "
|
| 21 |
},
|
| 22 |
{
|
| 23 |
"part": "group_pre",
|
| 24 |
"idx": 4,
|
| 25 |
-
"precision": "
|
| 26 |
},
|
| 27 |
{
|
| 28 |
"part": "group_pre",
|
| 29 |
"idx": 5,
|
| 30 |
-
"precision": "
|
| 31 |
},
|
| 32 |
{
|
| 33 |
"part": "group_pre",
|
| 34 |
"idx": 6,
|
| 35 |
-
"precision": "
|
| 36 |
},
|
| 37 |
{
|
| 38 |
"part": "group_pre",
|
| 39 |
"idx": 7,
|
| 40 |
-
"precision": "
|
| 41 |
},
|
| 42 |
{
|
| 43 |
"part": "group_pre",
|
| 44 |
"idx": 8,
|
| 45 |
-
"precision": "
|
| 46 |
},
|
| 47 |
{
|
| 48 |
"part": "group_pre",
|
| 49 |
"idx": 9,
|
| 50 |
-
"precision": "
|
| 51 |
},
|
| 52 |
{
|
| 53 |
"part": "group_pre",
|
| 54 |
"idx": 10,
|
| 55 |
-
"precision": "
|
| 56 |
},
|
| 57 |
{
|
| 58 |
"part": "group_pre",
|
| 59 |
"idx": 11,
|
| 60 |
-
"precision": "
|
| 61 |
},
|
| 62 |
{
|
| 63 |
"part": "group_pre",
|
| 64 |
"idx": 12,
|
| 65 |
-
"precision": "
|
| 66 |
},
|
| 67 |
{
|
| 68 |
"part": "group_pre",
|
| 69 |
"idx": 13,
|
| 70 |
-
"precision": "
|
| 71 |
},
|
| 72 |
{
|
| 73 |
"part": "group_pre",
|
| 74 |
"idx": 14,
|
| 75 |
-
"precision": "
|
| 76 |
},
|
| 77 |
{
|
| 78 |
"part": "group_pre",
|
| 79 |
"idx": 15,
|
| 80 |
-
"precision": "
|
| 81 |
},
|
| 82 |
{
|
| 83 |
"part": "group_pre",
|
| 84 |
"idx": 16,
|
| 85 |
-
"precision": "
|
| 86 |
},
|
| 87 |
{
|
| 88 |
"part": "group_pre",
|
| 89 |
"idx": 17,
|
| 90 |
-
"precision": "
|
| 91 |
},
|
| 92 |
{
|
| 93 |
"part": "group_pre",
|
| 94 |
"idx": 18,
|
| 95 |
-
"precision": "
|
| 96 |
},
|
| 97 |
{
|
| 98 |
"part": "group_pre",
|
| 99 |
"idx": 19,
|
| 100 |
-
"precision": "
|
| 101 |
},
|
| 102 |
{
|
| 103 |
"part": "group_pre",
|
| 104 |
"idx": 20,
|
| 105 |
-
"precision": "
|
| 106 |
},
|
| 107 |
{
|
| 108 |
"part": "group_pre",
|
| 109 |
"idx": 21,
|
| 110 |
-
"precision": "
|
| 111 |
},
|
| 112 |
{
|
| 113 |
"part": "group_pre",
|
| 114 |
"idx": 22,
|
| 115 |
-
"precision": "
|
| 116 |
},
|
| 117 |
{
|
| 118 |
"part": "group_pre",
|
| 119 |
"idx": 23,
|
| 120 |
-
"precision": "
|
| 121 |
},
|
| 122 |
{
|
| 123 |
"part": "group_pre",
|
| 124 |
"idx": 24,
|
| 125 |
-
"precision": "
|
| 126 |
},
|
| 127 |
{
|
| 128 |
"part": "group_pre",
|
| 129 |
"idx": 25,
|
| 130 |
-
"precision": "
|
| 131 |
},
|
| 132 |
{
|
| 133 |
"part": "group_pre",
|
| 134 |
"idx": 26,
|
| 135 |
-
"precision": "
|
| 136 |
},
|
| 137 |
{
|
| 138 |
"part": "group_pre",
|
| 139 |
"idx": 27,
|
| 140 |
-
"precision": "
|
| 141 |
},
|
| 142 |
{
|
| 143 |
"part": "group_pre",
|
| 144 |
"idx": 28,
|
| 145 |
-
"precision": "
|
| 146 |
},
|
| 147 |
{
|
| 148 |
"part": "group_pre",
|
| 149 |
"idx": 29,
|
| 150 |
-
"precision": "
|
| 151 |
},
|
| 152 |
{
|
| 153 |
"part": "group_pre",
|
| 154 |
"idx": 30,
|
| 155 |
-
"precision": "
|
| 156 |
},
|
| 157 |
{
|
| 158 |
"part": "group_pre",
|
| 159 |
"idx": 31,
|
| 160 |
-
"precision": "
|
| 161 |
},
|
| 162 |
{
|
| 163 |
"part": "group_post",
|
| 164 |
"idx": 0,
|
| 165 |
-
"precision": "
|
| 166 |
},
|
| 167 |
{
|
| 168 |
"part": "group_post",
|
| 169 |
"idx": 1,
|
| 170 |
-
"precision": "
|
| 171 |
},
|
| 172 |
{
|
| 173 |
"part": "group_post",
|
| 174 |
"idx": 2,
|
| 175 |
-
"precision": "
|
| 176 |
},
|
| 177 |
{
|
| 178 |
"part": "group_post",
|
| 179 |
"idx": 3,
|
| 180 |
-
"precision": "
|
| 181 |
},
|
| 182 |
{
|
| 183 |
"part": "group_post",
|
| 184 |
"idx": 4,
|
| 185 |
-
"precision": "
|
| 186 |
},
|
| 187 |
{
|
| 188 |
"part": "group_post",
|
| 189 |
"idx": 5,
|
| 190 |
-
"precision": "
|
| 191 |
},
|
| 192 |
{
|
| 193 |
"part": "group_post",
|
| 194 |
"idx": 6,
|
| 195 |
-
"precision": "
|
| 196 |
},
|
| 197 |
{
|
| 198 |
"part": "group_post",
|
| 199 |
"idx": 7,
|
| 200 |
-
"precision": "
|
| 201 |
},
|
| 202 |
{
|
| 203 |
"part": "group_post",
|
| 204 |
"idx": 8,
|
| 205 |
-
"precision": "
|
| 206 |
},
|
| 207 |
{
|
| 208 |
"part": "group_post",
|
| 209 |
"idx": 9,
|
| 210 |
-
"precision": "
|
| 211 |
},
|
| 212 |
{
|
| 213 |
"part": "group_post",
|
| 214 |
"idx": 10,
|
| 215 |
-
"precision": "
|
| 216 |
},
|
| 217 |
{
|
| 218 |
"part": "group_post",
|
| 219 |
"idx": 11,
|
| 220 |
-
"precision": "
|
| 221 |
},
|
| 222 |
{
|
| 223 |
"part": "group_post",
|
| 224 |
"idx": 12,
|
| 225 |
-
"precision": "
|
| 226 |
},
|
| 227 |
{
|
| 228 |
"part": "group_post",
|
| 229 |
"idx": 13,
|
| 230 |
-
"precision": "
|
| 231 |
},
|
| 232 |
{
|
| 233 |
"part": "group_post",
|
| 234 |
"idx": 14,
|
| 235 |
-
"precision": "
|
| 236 |
},
|
| 237 |
{
|
| 238 |
"part": "group_post",
|
| 239 |
"idx": 15,
|
| 240 |
-
"precision": "
|
| 241 |
},
|
| 242 |
{
|
| 243 |
"part": "group_post",
|
| 244 |
"idx": 16,
|
| 245 |
-
"precision": "
|
| 246 |
},
|
| 247 |
{
|
| 248 |
"part": "group_post",
|
| 249 |
"idx": 17,
|
| 250 |
-
"precision": "
|
| 251 |
},
|
| 252 |
{
|
| 253 |
"part": "group_post",
|
| 254 |
"idx": 18,
|
| 255 |
-
"precision": "
|
| 256 |
},
|
| 257 |
{
|
| 258 |
"part": "group_post",
|
| 259 |
"idx": 19,
|
| 260 |
-
"precision": "
|
| 261 |
},
|
| 262 |
{
|
| 263 |
"part": "group_post",
|
| 264 |
"idx": 20,
|
| 265 |
-
"precision": "
|
| 266 |
},
|
| 267 |
{
|
| 268 |
"part": "group_post",
|
| 269 |
"idx": 21,
|
| 270 |
-
"precision": "
|
| 271 |
},
|
| 272 |
{
|
| 273 |
"part": "group_post",
|
| 274 |
"idx": 22,
|
| 275 |
-
"precision": "
|
| 276 |
},
|
| 277 |
{
|
| 278 |
"part": "group_post",
|
| 279 |
"idx": 23,
|
| 280 |
-
"precision": "
|
| 281 |
},
|
| 282 |
{
|
| 283 |
"part": "group_post",
|
| 284 |
"idx": 24,
|
| 285 |
-
"precision": "
|
| 286 |
},
|
| 287 |
{
|
| 288 |
"part": "group_post",
|
| 289 |
"idx": 25,
|
| 290 |
-
"precision": "
|
| 291 |
},
|
| 292 |
{
|
| 293 |
"part": "group_post",
|
| 294 |
"idx": 26,
|
| 295 |
-
"precision": "
|
| 296 |
},
|
| 297 |
{
|
| 298 |
"part": "group_post",
|
| 299 |
"idx": 27,
|
| 300 |
-
"precision": "
|
| 301 |
},
|
| 302 |
{
|
| 303 |
"part": "group_post",
|
| 304 |
"idx": 28,
|
| 305 |
-
"precision": "
|
| 306 |
},
|
| 307 |
{
|
| 308 |
"part": "group_post",
|
| 309 |
"idx": 29,
|
| 310 |
-
"precision": "
|
| 311 |
},
|
| 312 |
{
|
| 313 |
"part": "group_post",
|
| 314 |
"idx": 30,
|
| 315 |
-
"precision": "
|
| 316 |
},
|
| 317 |
{
|
| 318 |
"part": "group_cache",
|
| 319 |
"idx": 0,
|
| 320 |
-
"precision": "
|
| 321 |
},
|
| 322 |
{
|
| 323 |
"part": "group_cache",
|
| 324 |
"idx": 128,
|
| 325 |
-
"precision": "
|
| 326 |
},
|
| 327 |
{
|
| 328 |
"part": "group_cache",
|
| 329 |
"idx": 256,
|
| 330 |
-
"precision": "
|
| 331 |
},
|
| 332 |
{
|
| 333 |
"part": "group_cache",
|
| 334 |
"idx": 384,
|
| 335 |
-
"precision": "
|
| 336 |
},
|
| 337 |
{
|
| 338 |
"part": "group_cache",
|
| 339 |
"idx": 512,
|
| 340 |
-
"precision": "
|
| 341 |
},
|
| 342 |
{
|
| 343 |
"part": "group_cache",
|
| 344 |
"idx": 640,
|
| 345 |
-
"precision": "
|
| 346 |
},
|
| 347 |
{
|
| 348 |
"part": "group_cache",
|
| 349 |
"idx": 768,
|
| 350 |
-
"precision": "
|
| 351 |
},
|
| 352 |
{
|
| 353 |
"part": "group_cache",
|
| 354 |
"idx": 896,
|
| 355 |
-
"precision": "
|
| 356 |
},
|
| 357 |
{
|
| 358 |
"part": "group_cache",
|
| 359 |
"idx": 1024,
|
| 360 |
-
"precision": "
|
| 361 |
},
|
| 362 |
{
|
| 363 |
"part": "group_cache",
|
| 364 |
"idx": 1152,
|
| 365 |
-
"precision": "
|
| 366 |
},
|
| 367 |
{
|
| 368 |
"part": "group_cache",
|
| 369 |
"idx": 1280,
|
| 370 |
-
"precision": "
|
| 371 |
},
|
| 372 |
{
|
| 373 |
"part": "group_cache",
|
| 374 |
"idx": 1408,
|
| 375 |
-
"precision": "
|
| 376 |
},
|
| 377 |
{
|
| 378 |
"part": "group_cache",
|
| 379 |
"idx": 1536,
|
| 380 |
-
"precision": "
|
| 381 |
},
|
| 382 |
{
|
| 383 |
"part": "group_cache",
|
| 384 |
"idx": 1664,
|
| 385 |
-
"precision": "
|
| 386 |
},
|
| 387 |
{
|
| 388 |
"part": "group_cache",
|
| 389 |
"idx": 1792,
|
| 390 |
-
"precision": "
|
| 391 |
},
|
| 392 |
{
|
| 393 |
"part": "group_cache",
|
| 394 |
"idx": 1920,
|
| 395 |
-
"precision": "
|
| 396 |
},
|
| 397 |
{
|
| 398 |
"part": "single_pre",
|
|
|
|
| 2 |
{
|
| 3 |
"part": "group_pre",
|
| 4 |
"idx": 0,
|
| 5 |
+
"precision": "A_BF16_W_INT8"
|
| 6 |
},
|
| 7 |
{
|
| 8 |
"part": "group_pre",
|
| 9 |
"idx": 1,
|
| 10 |
+
"precision": "A_BF16_W_INT8"
|
| 11 |
},
|
| 12 |
{
|
| 13 |
"part": "group_pre",
|
| 14 |
"idx": 2,
|
| 15 |
+
"precision": "A_BF16_W_INT8"
|
| 16 |
},
|
| 17 |
{
|
| 18 |
"part": "group_pre",
|
| 19 |
"idx": 3,
|
| 20 |
+
"precision": "A_BF16_W_INT8"
|
| 21 |
},
|
| 22 |
{
|
| 23 |
"part": "group_pre",
|
| 24 |
"idx": 4,
|
| 25 |
+
"precision": "A_BF16_W_INT8"
|
| 26 |
},
|
| 27 |
{
|
| 28 |
"part": "group_pre",
|
| 29 |
"idx": 5,
|
| 30 |
+
"precision": "A_BF16_W_INT8"
|
| 31 |
},
|
| 32 |
{
|
| 33 |
"part": "group_pre",
|
| 34 |
"idx": 6,
|
| 35 |
+
"precision": "A_BF16_W_INT8"
|
| 36 |
},
|
| 37 |
{
|
| 38 |
"part": "group_pre",
|
| 39 |
"idx": 7,
|
| 40 |
+
"precision": "A_BF16_W_INT8"
|
| 41 |
},
|
| 42 |
{
|
| 43 |
"part": "group_pre",
|
| 44 |
"idx": 8,
|
| 45 |
+
"precision": "A_BF16_W_INT8"
|
| 46 |
},
|
| 47 |
{
|
| 48 |
"part": "group_pre",
|
| 49 |
"idx": 9,
|
| 50 |
+
"precision": "A_BF16_W_INT8"
|
| 51 |
},
|
| 52 |
{
|
| 53 |
"part": "group_pre",
|
| 54 |
"idx": 10,
|
| 55 |
+
"precision": "A_BF16_W_INT8"
|
| 56 |
},
|
| 57 |
{
|
| 58 |
"part": "group_pre",
|
| 59 |
"idx": 11,
|
| 60 |
+
"precision": "A_BF16_W_INT8"
|
| 61 |
},
|
| 62 |
{
|
| 63 |
"part": "group_pre",
|
| 64 |
"idx": 12,
|
| 65 |
+
"precision": "A_BF16_W_INT8"
|
| 66 |
},
|
| 67 |
{
|
| 68 |
"part": "group_pre",
|
| 69 |
"idx": 13,
|
| 70 |
+
"precision": "A_BF16_W_INT8"
|
| 71 |
},
|
| 72 |
{
|
| 73 |
"part": "group_pre",
|
| 74 |
"idx": 14,
|
| 75 |
+
"precision": "A_BF16_W_INT8"
|
| 76 |
},
|
| 77 |
{
|
| 78 |
"part": "group_pre",
|
| 79 |
"idx": 15,
|
| 80 |
+
"precision": "A_BF16_W_INT8"
|
| 81 |
},
|
| 82 |
{
|
| 83 |
"part": "group_pre",
|
| 84 |
"idx": 16,
|
| 85 |
+
"precision": "A_BF16_W_INT8"
|
| 86 |
},
|
| 87 |
{
|
| 88 |
"part": "group_pre",
|
| 89 |
"idx": 17,
|
| 90 |
+
"precision": "A_BF16_W_INT8"
|
| 91 |
},
|
| 92 |
{
|
| 93 |
"part": "group_pre",
|
| 94 |
"idx": 18,
|
| 95 |
+
"precision": "A_BF16_W_INT8"
|
| 96 |
},
|
| 97 |
{
|
| 98 |
"part": "group_pre",
|
| 99 |
"idx": 19,
|
| 100 |
+
"precision": "A_BF16_W_INT8"
|
| 101 |
},
|
| 102 |
{
|
| 103 |
"part": "group_pre",
|
| 104 |
"idx": 20,
|
| 105 |
+
"precision": "A_BF16_W_INT8"
|
| 106 |
},
|
| 107 |
{
|
| 108 |
"part": "group_pre",
|
| 109 |
"idx": 21,
|
| 110 |
+
"precision": "A_BF16_W_INT8"
|
| 111 |
},
|
| 112 |
{
|
| 113 |
"part": "group_pre",
|
| 114 |
"idx": 22,
|
| 115 |
+
"precision": "A_BF16_W_INT8"
|
| 116 |
},
|
| 117 |
{
|
| 118 |
"part": "group_pre",
|
| 119 |
"idx": 23,
|
| 120 |
+
"precision": "A_BF16_W_INT8"
|
| 121 |
},
|
| 122 |
{
|
| 123 |
"part": "group_pre",
|
| 124 |
"idx": 24,
|
| 125 |
+
"precision": "A_BF16_W_INT8"
|
| 126 |
},
|
| 127 |
{
|
| 128 |
"part": "group_pre",
|
| 129 |
"idx": 25,
|
| 130 |
+
"precision": "A_BF16_W_INT8"
|
| 131 |
},
|
| 132 |
{
|
| 133 |
"part": "group_pre",
|
| 134 |
"idx": 26,
|
| 135 |
+
"precision": "A_BF16_W_INT8"
|
| 136 |
},
|
| 137 |
{
|
| 138 |
"part": "group_pre",
|
| 139 |
"idx": 27,
|
| 140 |
+
"precision": "A_BF16_W_INT8"
|
| 141 |
},
|
| 142 |
{
|
| 143 |
"part": "group_pre",
|
| 144 |
"idx": 28,
|
| 145 |
+
"precision": "A_BF16_W_INT8"
|
| 146 |
},
|
| 147 |
{
|
| 148 |
"part": "group_pre",
|
| 149 |
"idx": 29,
|
| 150 |
+
"precision": "A_BF16_W_INT8"
|
| 151 |
},
|
| 152 |
{
|
| 153 |
"part": "group_pre",
|
| 154 |
"idx": 30,
|
| 155 |
+
"precision": "A_BF16_W_INT8"
|
| 156 |
},
|
| 157 |
{
|
| 158 |
"part": "group_pre",
|
| 159 |
"idx": 31,
|
| 160 |
+
"precision": "A_BF16_W_INT8"
|
| 161 |
},
|
| 162 |
{
|
| 163 |
"part": "group_post",
|
| 164 |
"idx": 0,
|
| 165 |
+
"precision": "A_BF16_W_INT8"
|
| 166 |
},
|
| 167 |
{
|
| 168 |
"part": "group_post",
|
| 169 |
"idx": 1,
|
| 170 |
+
"precision": "A_BF16_W_INT8"
|
| 171 |
},
|
| 172 |
{
|
| 173 |
"part": "group_post",
|
| 174 |
"idx": 2,
|
| 175 |
+
"precision": "A_BF16_W_INT8"
|
| 176 |
},
|
| 177 |
{
|
| 178 |
"part": "group_post",
|
| 179 |
"idx": 3,
|
| 180 |
+
"precision": "A_BF16_W_INT8"
|
| 181 |
},
|
| 182 |
{
|
| 183 |
"part": "group_post",
|
| 184 |
"idx": 4,
|
| 185 |
+
"precision": "A_BF16_W_INT8"
|
| 186 |
},
|
| 187 |
{
|
| 188 |
"part": "group_post",
|
| 189 |
"idx": 5,
|
| 190 |
+
"precision": "A_BF16_W_INT8"
|
| 191 |
},
|
| 192 |
{
|
| 193 |
"part": "group_post",
|
| 194 |
"idx": 6,
|
| 195 |
+
"precision": "A_BF16_W_INT8"
|
| 196 |
},
|
| 197 |
{
|
| 198 |
"part": "group_post",
|
| 199 |
"idx": 7,
|
| 200 |
+
"precision": "A_BF16_W_INT8"
|
| 201 |
},
|
| 202 |
{
|
| 203 |
"part": "group_post",
|
| 204 |
"idx": 8,
|
| 205 |
+
"precision": "A_BF16_W_INT8"
|
| 206 |
},
|
| 207 |
{
|
| 208 |
"part": "group_post",
|
| 209 |
"idx": 9,
|
| 210 |
+
"precision": "A_BF16_W_INT8"
|
| 211 |
},
|
| 212 |
{
|
| 213 |
"part": "group_post",
|
| 214 |
"idx": 10,
|
| 215 |
+
"precision": "A_BF16_W_INT8"
|
| 216 |
},
|
| 217 |
{
|
| 218 |
"part": "group_post",
|
| 219 |
"idx": 11,
|
| 220 |
+
"precision": "A_BF16_W_INT8"
|
| 221 |
},
|
| 222 |
{
|
| 223 |
"part": "group_post",
|
| 224 |
"idx": 12,
|
| 225 |
+
"precision": "A_BF16_W_INT8"
|
| 226 |
},
|
| 227 |
{
|
| 228 |
"part": "group_post",
|
| 229 |
"idx": 13,
|
| 230 |
+
"precision": "A_BF16_W_INT8"
|
| 231 |
},
|
| 232 |
{
|
| 233 |
"part": "group_post",
|
| 234 |
"idx": 14,
|
| 235 |
+
"precision": "A_BF16_W_INT8"
|
| 236 |
},
|
| 237 |
{
|
| 238 |
"part": "group_post",
|
| 239 |
"idx": 15,
|
| 240 |
+
"precision": "A_BF16_W_INT8"
|
| 241 |
},
|
| 242 |
{
|
| 243 |
"part": "group_post",
|
| 244 |
"idx": 16,
|
| 245 |
+
"precision": "A_BF16_W_INT8"
|
| 246 |
},
|
| 247 |
{
|
| 248 |
"part": "group_post",
|
| 249 |
"idx": 17,
|
| 250 |
+
"precision": "A_BF16_W_INT8"
|
| 251 |
},
|
| 252 |
{
|
| 253 |
"part": "group_post",
|
| 254 |
"idx": 18,
|
| 255 |
+
"precision": "A_BF16_W_INT8"
|
| 256 |
},
|
| 257 |
{
|
| 258 |
"part": "group_post",
|
| 259 |
"idx": 19,
|
| 260 |
+
"precision": "A_BF16_W_INT8"
|
| 261 |
},
|
| 262 |
{
|
| 263 |
"part": "group_post",
|
| 264 |
"idx": 20,
|
| 265 |
+
"precision": "A_BF16_W_INT8"
|
| 266 |
},
|
| 267 |
{
|
| 268 |
"part": "group_post",
|
| 269 |
"idx": 21,
|
| 270 |
+
"precision": "A_BF16_W_INT8"
|
| 271 |
},
|
| 272 |
{
|
| 273 |
"part": "group_post",
|
| 274 |
"idx": 22,
|
| 275 |
+
"precision": "A_BF16_W_INT8"
|
| 276 |
},
|
| 277 |
{
|
| 278 |
"part": "group_post",
|
| 279 |
"idx": 23,
|
| 280 |
+
"precision": "A_BF16_W_INT8"
|
| 281 |
},
|
| 282 |
{
|
| 283 |
"part": "group_post",
|
| 284 |
"idx": 24,
|
| 285 |
+
"precision": "A_BF16_W_INT8"
|
| 286 |
},
|
| 287 |
{
|
| 288 |
"part": "group_post",
|
| 289 |
"idx": 25,
|
| 290 |
+
"precision": "A_BF16_W_INT8"
|
| 291 |
},
|
| 292 |
{
|
| 293 |
"part": "group_post",
|
| 294 |
"idx": 26,
|
| 295 |
+
"precision": "A_BF16_W_INT8"
|
| 296 |
},
|
| 297 |
{
|
| 298 |
"part": "group_post",
|
| 299 |
"idx": 27,
|
| 300 |
+
"precision": "A_BF16_W_INT8"
|
| 301 |
},
|
| 302 |
{
|
| 303 |
"part": "group_post",
|
| 304 |
"idx": 28,
|
| 305 |
+
"precision": "A_BF16_W_INT8"
|
| 306 |
},
|
| 307 |
{
|
| 308 |
"part": "group_post",
|
| 309 |
"idx": 29,
|
| 310 |
+
"precision": "A_BF16_W_INT8"
|
| 311 |
},
|
| 312 |
{
|
| 313 |
"part": "group_post",
|
| 314 |
"idx": 30,
|
| 315 |
+
"precision": "A_BF16_W_INT8"
|
| 316 |
},
|
| 317 |
{
|
| 318 |
"part": "group_cache",
|
| 319 |
"idx": 0,
|
| 320 |
+
"precision": "A_BF16_W_INT8"
|
| 321 |
},
|
| 322 |
{
|
| 323 |
"part": "group_cache",
|
| 324 |
"idx": 128,
|
| 325 |
+
"precision": "A_BF16_W_INT8"
|
| 326 |
},
|
| 327 |
{
|
| 328 |
"part": "group_cache",
|
| 329 |
"idx": 256,
|
| 330 |
+
"precision": "A_BF16_W_INT8"
|
| 331 |
},
|
| 332 |
{
|
| 333 |
"part": "group_cache",
|
| 334 |
"idx": 384,
|
| 335 |
+
"precision": "A_BF16_W_INT8"
|
| 336 |
},
|
| 337 |
{
|
| 338 |
"part": "group_cache",
|
| 339 |
"idx": 512,
|
| 340 |
+
"precision": "A_BF16_W_INT8"
|
| 341 |
},
|
| 342 |
{
|
| 343 |
"part": "group_cache",
|
| 344 |
"idx": 640,
|
| 345 |
+
"precision": "A_BF16_W_INT8"
|
| 346 |
},
|
| 347 |
{
|
| 348 |
"part": "group_cache",
|
| 349 |
"idx": 768,
|
| 350 |
+
"precision": "A_BF16_W_INT8"
|
| 351 |
},
|
| 352 |
{
|
| 353 |
"part": "group_cache",
|
| 354 |
"idx": 896,
|
| 355 |
+
"precision": "A_BF16_W_INT8"
|
| 356 |
},
|
| 357 |
{
|
| 358 |
"part": "group_cache",
|
| 359 |
"idx": 1024,
|
| 360 |
+
"precision": "A_BF16_W_INT8"
|
| 361 |
},
|
| 362 |
{
|
| 363 |
"part": "group_cache",
|
| 364 |
"idx": 1152,
|
| 365 |
+
"precision": "A_BF16_W_INT8"
|
| 366 |
},
|
| 367 |
{
|
| 368 |
"part": "group_cache",
|
| 369 |
"idx": 1280,
|
| 370 |
+
"precision": "A_BF16_W_INT8"
|
| 371 |
},
|
| 372 |
{
|
| 373 |
"part": "group_cache",
|
| 374 |
"idx": 1408,
|
| 375 |
+
"precision": "A_BF16_W_INT8"
|
| 376 |
},
|
| 377 |
{
|
| 378 |
"part": "group_cache",
|
| 379 |
"idx": 1536,
|
| 380 |
+
"precision": "A_BF16_W_INT8"
|
| 381 |
},
|
| 382 |
{
|
| 383 |
"part": "group_cache",
|
| 384 |
"idx": 1664,
|
| 385 |
+
"precision": "A_BF16_W_INT8"
|
| 386 |
},
|
| 387 |
{
|
| 388 |
"part": "group_cache",
|
| 389 |
"idx": 1792,
|
| 390 |
+
"precision": "A_BF16_W_INT8"
|
| 391 |
},
|
| 392 |
{
|
| 393 |
"part": "group_cache",
|
| 394 |
"idx": 1920,
|
| 395 |
+
"precision": "A_BF16_W_INT8"
|
| 396 |
},
|
| 397 |
{
|
| 398 |
"part": "single_pre",
|
devkit/vlm_config.json
CHANGED
|
@@ -58,6 +58,7 @@
|
|
| 58 |
},
|
| 59 |
"pipeline_cfg": {
|
| 60 |
"system_prompt": null,
|
|
|
|
| 61 |
"max_num_tokens": 2048,
|
| 62 |
"input_token_group_size": 128,
|
| 63 |
"input_token_group_offsets": [
|
|
|
|
| 58 |
},
|
| 59 |
"pipeline_cfg": {
|
| 60 |
"system_prompt": null,
|
| 61 |
+
"chat_template": null,
|
| 62 |
"max_num_tokens": 2048,
|
| 63 |
"input_token_group_size": 128,
|
| 64 |
"input_token_group_offsets": [
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token0_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:97f7225ec5001f8d7eaecccf8968183cb3210a187938eec9153726875b509e12
|
| 3 |
+
size 4240016
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token1024_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:763eae829c00cd5763d2ceb6cef99d9f4af626ff9654b8e3e2e1107e3dce0fbc
|
| 3 |
+
size 11947200
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token1152_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:89b8f3448c5f9c9bc697223a4690b61f473c790517c9e536544b16d329fcf747
|
| 3 |
+
size 14312472
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token1280_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7513575be5269025d73aa7e47bdffc61dc9efe3e88d486a68a65f2d32cf8dc96
|
| 3 |
+
size 13877000
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token128_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:33b80180cfd64edbe73f7a112026b593dbc0db19f63d76dad93bf4f5f85ecb75
|
| 3 |
+
size 4589520
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token1408_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9646b2ee00296dcd2388428a9de95f9f81e7b5c4882fc074c3d9bf1e48d448e0
|
| 3 |
+
size 16241328
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token1536_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e1b6a774e18e211bfe5ad6bcb274440b0c88e40795daee95e1792968027557ee
|
| 3 |
+
size 17234088
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token1664_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:efa38ce1343e1e211009754db74baedc487043b8062a4f828828287b966850ad
|
| 3 |
+
size 17028880
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token1792_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:464df902cad97f55e207f08df10e7a5496d0a26822ef4dad01aef7268cb9dc59
|
| 3 |
+
size 17311696
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token1920_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cfa2613dc103461e2cb9703ffb5d86d5a2ea286c8b38e0720bd96721e332fa0a
|
| 3 |
+
size 18200312
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token256_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ce69cdfe040d984e4c7f3dd3e38963225d9d23762f4d4d40950f03481dc95501
|
| 3 |
+
size 4716480
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token384_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4dd52462033ce61ff08760045c26a587586e64c6b59b9e1ba96e3ec7881e8b91
|
| 3 |
+
size 6127904
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token512_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:27cf5a5e974d2edc36cc6a1a82efc950da307381a3929cbb331fdad74f568344
|
| 3 |
+
size 6492640
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token640_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bd6a756a8abb52be2103db517589c22d75834159957466bd030c4ea723fae5d2
|
| 3 |
+
size 7985248
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token768_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:22d57de5899d3be2dabedcdcac29fca6e362f6eb5c47ccc71b86d88577545123
|
| 3 |
+
size 10248464
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_cache_token896_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:47ade818ffceeafd01ce7c8d1a1cf6af4a0b0cc360214e400f72f4851863430e
|
| 3 |
+
size 10592440
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer0_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c25ad95ee3a0a6db3b058054b88be65fb6fc7c42ed18eaa69049bf0226c84a51
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer10_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:624b3ee8f354635f99400d52eb25ca8e4efb2d64f706db83a24b1de460645401
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer11_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ecc0e9fa065faabd982709d1b43517d59148b980999ed50550ec5e2e3bc8a18
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer12_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a35f716c26965facc09ad7cfdf68504c3c18ce0f9230cf27be4765420096f0e7
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer13_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8580e6066049d52ff2ffcc888afb0eb9cedcce7b6f7bf5351a8051a224d4ec19
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer14_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:02439d491d45adca1fdd82d206d7b3fe29e220c1f79351b92d0c90a6b7428940
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer15_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ab0088da4413cb52d31b957194b816237bf68f05c9a79a154df712ea46166c9
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer16_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b5744d6bd9d532e1f0830eca4847b8eac391032b131ee97e8ca392676c6d0f44
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer17_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b0b4b322d097d9b8689e0682001bf6917b76c5ccd617f7e92fb656fba76ab720
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer18_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ff53bd3c5fd667c092dd7ec9a9cba060b53481996224fd02a4d2837683802ded
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer19_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d78f9c7303ccd2bc0ba34be61e128247a911b63b535fa690109d24323c8db12
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer1_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:25133416797b0c9000ba1dfebbbde19dab740cd1e73a2fe644d5556b840d2c1c
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer20_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a14ba40ace148a42c858e5a6db175d1f3fe182b3f91073f5801b79b0012d673
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer21_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3f58d7cd6279d42eb3666f7367ae9e5ea7c0e33743069f9411efee1924a87d7a
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer22_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1ca894a2b5465f1c82ae70d79e611fdfc5fac95ce623f84121706d912c3315fa
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer23_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bafe95dba0cf621cb8f52da6f8745df375aa3a3ee969591083ab9bf643f9af2d
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer24_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9915f47651c8b43557de4723346f80d5c7de009163a3ece8866602fdab739a51
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer25_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aede89a4ed26c487954677784e75c4740a83bc19de19695a98715104edbae52a
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer26_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3fc5a1d05d540ab15047386b972eb436a6c675755bf7b4ce315e64bc5ff71edf
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer27_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e32b337ecddabb0768c77a9d54379a443d5fc945bc084137d68c8960f8b30d9d
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer28_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:41a679bf4319c7f4d38532420332b9b8a4bfb82957385bbe2b34db776e235b0c
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer29_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eb01ee25042e96fd763397574ecd45235977ce666aa7dfc9dac439efd01b619a
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer2_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1cd7871ffc8f0405ca54fb82f2d0aa837497b9c76a134b1dc38237a55f2e2c12
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer30_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:66671b9cc9c4cfdd350346910a0faf1f5d9f1f923a4e906d1d62fe5d53e756d4
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer3_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5802c98bcb45cd6528e2be14f786126e1c7f27895513c71b9f5324d2eccfaadb
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer4_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e118ba9974dea80e73524d0b5ba99058f9fd23b0a5411f2f5cb3f2865a2e8792
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer5_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4763377bf6b4e4c966cc1629046357a43f39f839b8f2f79249071a953f9b5703
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer6_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0725234ea4ac26dc4dcd9938f695a099d29b9ffebbb7d8b64b1aa3fb44e9bd77
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer7_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0b9950dc1ce5aa42d85900da1e3c1c061e236f4dcdcbc0b8fed6576c84b35f3a
|
| 3 |
+
size 220746936
|
elf_files/models--mistralai--Mistral-7B-Instruct-v0.3_language_n128_post_layer8_stage1_mla.elf
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:79a05328b50baf4f6459e62d7d3944542e251cb422b7dbe223d16d7c415814ff
|
| 3 |
+
size 220746936
|