Upload 8 files
Browse files
- config.json +3 -3
- generation_config.json +1 -1
- tokenizer_config.json +1 -1
config.json
CHANGED
|
@@ -7,6 +7,7 @@
|
|
| 7 |
"attention_dropout": 0.0,
|
| 8 |
"attn_logit_softcapping": null,
|
| 9 |
"bos_token_id": 2,
|
|
|
|
| 10 |
"eos_token_id": 106,
|
| 11 |
"final_logit_softcapping": null,
|
| 12 |
"head_dim": 256,
|
|
@@ -46,10 +47,9 @@
|
|
| 46 |
"rope_scaling": null,
|
| 47 |
"rope_theta": 1000000.0,
|
| 48 |
"sliding_window": 512,
|
| 49 |
-
"torch_dtype": "bfloat16",
|
| 50 |
-
"transformers_version": "4.55.3",
|
| 51 |
"unsloth_fixed": true,
|
| 52 |
-
"unsloth_version": "2025.
|
| 53 |
"use_bidirectional_attention": false,
|
| 54 |
"use_cache": true,
|
| 55 |
"vocab_size": 262144
|
|
|
|
| 7 |
"attention_dropout": 0.0,
|
| 8 |
"attn_logit_softcapping": null,
|
| 9 |
"bos_token_id": 2,
|
| 10 |
+
"dtype": "bfloat16",
|
| 11 |
"eos_token_id": 106,
|
| 12 |
"final_logit_softcapping": null,
|
| 13 |
"head_dim": 256,
|
|
|
|
| 47 |
"rope_scaling": null,
|
| 48 |
"rope_theta": 1000000.0,
|
| 49 |
"sliding_window": 512,
|
| 50 |
+
"transformers_version": "4.57.2",
|
|
|
|
| 51 |
"unsloth_fixed": true,
|
| 52 |
+
"unsloth_version": "2025.11.4",
|
| 53 |
"use_bidirectional_attention": false,
|
| 54 |
"use_cache": true,
|
| 55 |
"vocab_size": 262144
|
generation_config.json
CHANGED
|
@@ -10,5 +10,5 @@
|
|
| 10 |
"pad_token_id": 0,
|
| 11 |
"top_k": 64,
|
| 12 |
"top_p": 0.95,
|
| 13 |
-
"transformers_version": "4.55.3"
|
| 14 |
}
|
|
|
|
| 10 |
"pad_token_id": 0,
|
| 11 |
"top_k": 64,
|
| 12 |
"top_p": 0.95,
|
| 13 |
+
"transformers_version": "4.57.2"
|
| 14 |
}
|
tokenizer_config.json
CHANGED
|
@@ -51336,7 +51336,7 @@
|
|
| 51336 |
"image_token": "<image_soft_token>",
|
| 51337 |
"model_max_length": 32768,
|
| 51338 |
"pad_token": "<pad>",
|
| 51339 |
-
"padding_side": "
|
| 51340 |
"sp_model_kwargs": null,
|
| 51341 |
"spaces_between_special_tokens": false,
|
| 51342 |
"tokenizer_class": "GemmaTokenizer",
|
|
|
|
| 51336 |
"image_token": "<image_soft_token>",
|
| 51337 |
"model_max_length": 32768,
|
| 51338 |
"pad_token": "<pad>",
|
| 51339 |
+
"padding_side": "left",
|
| 51340 |
"sp_model_kwargs": null,
|
| 51341 |
"spaces_between_special_tokens": false,
|
| 51342 |
"tokenizer_class": "GemmaTokenizer",
|