Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +5 -0
- global_step_10/data.pt +3 -0
- global_step_100/data.pt +3 -0
- global_step_110/data.pt +3 -0
- global_step_120/data.pt +3 -0
- global_step_130/data.pt +3 -0
- global_step_140/data.pt +3 -0
- global_step_150/data.pt +3 -0
- global_step_160/data.pt +3 -0
- global_step_170/data.pt +3 -0
- global_step_180/data.pt +3 -0
- global_step_190/data.pt +3 -0
- global_step_20/data.pt +3 -0
- global_step_200/data.pt +3 -0
- global_step_210/data.pt +3 -0
- global_step_220/data.pt +3 -0
- global_step_230/data.pt +3 -0
- global_step_240/data.pt +3 -0
- global_step_250/data.pt +3 -0
- global_step_260/data.pt +3 -0
- global_step_270/data.pt +3 -0
- global_step_280/data.pt +3 -0
- global_step_290/data.pt +3 -0
- global_step_30/data.pt +3 -0
- global_step_300/data.pt +3 -0
- global_step_310/data.pt +3 -0
- global_step_320/data.pt +3 -0
- global_step_330/data.pt +3 -0
- global_step_340/data.pt +3 -0
- global_step_350/data.pt +3 -0
- global_step_360/data.pt +3 -0
- global_step_370/data.pt +3 -0
- global_step_380/data.pt +3 -0
- global_step_390/data.pt +3 -0
- global_step_40/data.pt +3 -0
- global_step_400/data.pt +3 -0
- global_step_410/actor/extra_state_world_size_8_rank_0.pt +3 -0
- global_step_410/actor/extra_state_world_size_8_rank_1.pt +3 -0
- global_step_410/actor/extra_state_world_size_8_rank_2.pt +3 -0
- global_step_410/actor/extra_state_world_size_8_rank_3.pt +3 -0
- global_step_410/actor/extra_state_world_size_8_rank_4.pt +3 -0
- global_step_410/actor/extra_state_world_size_8_rank_5.pt +3 -0
- global_step_410/actor/extra_state_world_size_8_rank_6.pt +3 -0
- global_step_410/actor/extra_state_world_size_8_rank_7.pt +3 -0
- global_step_410/actor/fsdp_config.json +4 -0
- global_step_410/actor/huggingface/added_tokens.json +24 -0
- global_step_410/actor/huggingface/config.json +30 -0
- global_step_410/actor/huggingface/generation_config.json +6 -0
- global_step_410/actor/huggingface/merges.txt +0 -0
- global_step_410/actor/huggingface/special_tokens_map.json +31 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,8 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
global_step_410/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
global_step_420/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
global_step_430/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
global_step_440/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
global_step_444/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
global_step_10/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f6fc06061c18de82c1bff536c8d1c4b98f4633642f047e7412d35d875b3c80dc
|
| 3 |
+
size 1492
|
global_step_100/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:407653bd4760b1e440f3aaa36dfac7a28063c8a546943744a167fbce1940a009
|
| 3 |
+
size 1492
|
global_step_110/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f5816bdbe347af5cfcc78fa754198e1a17af58551902356a81196d915d321f45
|
| 3 |
+
size 1492
|
global_step_120/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e242e96f61df19dfb9bbde623c4254a7da8ff50758f00d18d705acc72b997592
|
| 3 |
+
size 1492
|
global_step_130/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5979aa467be1e536d8e417f42bdf7725360ea09b192472b90b1336f1a795f344
|
| 3 |
+
size 1492
|
global_step_140/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5dc11924e124a96f8405030ac3a502567470c942fc2e0ce50a926e6756ea6804
|
| 3 |
+
size 1492
|
global_step_150/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:34312f7f90f7d02cd54422f373db7ae73288619441d727408f8095b8e743d93c
|
| 3 |
+
size 1492
|
global_step_160/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4beafb3903a61a5b8931b2244c9646d86f3323b220cbd7ef8e0a4f7c5ebe50c6
|
| 3 |
+
size 1492
|
global_step_170/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:324e3c63297dbbb0896ace53e437fde8c16bedfdd4b9ff3622b5f82765a495c8
|
| 3 |
+
size 1492
|
global_step_180/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d57cb5f126397d905ce3934b2ff234038015504ea623830feb44c36f67aad769
|
| 3 |
+
size 1492
|
global_step_190/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8dcc9a7e9c6692133ba40e987626b791a8f641fe5d855146e6aa1181683ba3cd
|
| 3 |
+
size 1492
|
global_step_20/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a39167e06ff02c838a85e0ff9bb15b0cb6d31a7a5cd9b6585701cf0959d11cbd
|
| 3 |
+
size 1492
|
global_step_200/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a7abf0ebf41e4db9e7050db9b25a69ec5a39a54089461a592a08b4597d152a77
|
| 3 |
+
size 1492
|
global_step_210/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6838cb9498d35d1b52c9ff7498f9827392d4203a10128ea75633395fc63cfbeb
|
| 3 |
+
size 1492
|
global_step_220/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b974931ed4f9ecc59001485f7c3c0b7bca70b43b8946a47df6ae98912702f385
|
| 3 |
+
size 1492
|
global_step_230/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4ea2acfa13a27a676f9fccfb3eb6206aa449ca270df83d18a2ec06f8b986681d
|
| 3 |
+
size 1492
|
global_step_240/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:076b37140e866ec73443ba4bee36b2de1c2530f912f924ad044135c66f70d6dd
|
| 3 |
+
size 1492
|
global_step_250/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba141180adfc87ee092b3e29b2acb95ff3efc69f9218c5a6a70a105569158f60
|
| 3 |
+
size 1492
|
global_step_260/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1fa67b155a8ab2e27b76c73d55f7d01b779c2c77ea4015f0b387d4d38be1af0d
|
| 3 |
+
size 1556
|
global_step_270/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c16a501a067b4e4cd9221ed51920cdd93b6aa407489190cdc219bd0d36cdff3c
|
| 3 |
+
size 1556
|
global_step_280/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e4cab060318e24f1bcaed728dcaeb281197395b8142041bf0c8cbd037be60477
|
| 3 |
+
size 1556
|
global_step_290/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e80c8fadcf99481ae9c19d1ea9bcc656d233754ca4477104f310abff9de2c550
|
| 3 |
+
size 1556
|
global_step_30/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ef17218db9540c8867f8d02fb009d26d7f8687d94da5de0359073f696685d072
|
| 3 |
+
size 1492
|
global_step_300/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:31070d05a53ef1bb5fbff1eb2e26a7275c25f91b30b5e531017a83256e27e012
|
| 3 |
+
size 1556
|
global_step_310/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2162c5204e957c4d9e49cbae530e7057035c63f467792b2ed7cf6dba51bc1a47
|
| 3 |
+
size 1556
|
global_step_320/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:57b5bd505dc9b97a1d6990040da3ca6352855aaf4f6d5910ec91339efd9ae58c
|
| 3 |
+
size 1556
|
global_step_330/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee48d6295ae72fbf082011ec9b31252187c05e7e7a1576994751af51874557f5
|
| 3 |
+
size 1556
|
global_step_340/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:303e193e32baf38eff6fd45eae035b166ca0ddc0d4677e05b67e464e44900995
|
| 3 |
+
size 1556
|
global_step_350/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:20d8d0c273a118408154c8c91a7389a26828515b387706b4366dd34731f289c7
|
| 3 |
+
size 1556
|
global_step_360/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:80389a6ab5414b746c0a9057f79847873259626504d2d97d2b1020d0ecb372e0
|
| 3 |
+
size 1556
|
global_step_370/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bee5e740a65f2131b9cf6df35ef0e240ab4cb884cd226f0c0ebffdd0cdbcc1fe
|
| 3 |
+
size 1556
|
global_step_380/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c22dab01cda0946c739f64fff7b8555c745123e8c75b45c6e523f9a535e5516
|
| 3 |
+
size 1556
|
global_step_390/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b0bc4b483ead790e3d4787d4f4b723947d4861a465102f0b96fa6a1064ac1503
|
| 3 |
+
size 1556
|
global_step_40/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b8c180e6b75954c8fa351e0ac2218ff7dd7ac1477cc145b96118eff939ce6eca
|
| 3 |
+
size 1492
|
global_step_400/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f85a323664c3aa91198f23f964bdc120acbd442c0c6b7520c0c3c52cb3e47001
|
| 3 |
+
size 1556
|
global_step_410/actor/extra_state_world_size_8_rank_0.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:05b3ba55c9ab6f3006692a7c6183587902010dfd80b4ec0dde50c9a56f489b20
|
| 3 |
+
size 14632
|
global_step_410/actor/extra_state_world_size_8_rank_1.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:936d9887d3ff3688cc3a2ea9298b8ca0531f83b612463829b9dee248647925d6
|
| 3 |
+
size 14632
|
global_step_410/actor/extra_state_world_size_8_rank_2.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:408538fda8acacabcdec600c3b52d58f33fc116146fdfff08ad8dad398f2c7dc
|
| 3 |
+
size 14632
|
global_step_410/actor/extra_state_world_size_8_rank_3.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c2da863bf61902e45b320b63a58adebeda67a457be79b67057d0e53591ac9f89
|
| 3 |
+
size 14632
|
global_step_410/actor/extra_state_world_size_8_rank_4.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cecd819e59aee6a4a807036b2067ac751192cf69b917a5a598adb6c2bc67651b
|
| 3 |
+
size 14632
|
global_step_410/actor/extra_state_world_size_8_rank_5.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:97b4f0ec301ea549313d6f189a6078cc8e76af2155a10640ff7349f6710521f7
|
| 3 |
+
size 14632
|
global_step_410/actor/extra_state_world_size_8_rank_6.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:637234e33bd402a548e946634ebe04fd7f62954964ee7fe36933221d2fdab47c
|
| 3 |
+
size 14632
|
global_step_410/actor/extra_state_world_size_8_rank_7.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b18f4e1215deeeab897b1128842ca688e1bc80566906e3b5834f2445d60675f4
|
| 3 |
+
size 14632
|
global_step_410/actor/fsdp_config.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"FSDP_version": 1,
|
| 3 |
+
"world_size": 8
|
| 4 |
+
}
|
global_step_410/actor/huggingface/added_tokens.json
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"</tool_call>": 151658,
|
| 3 |
+
"<tool_call>": 151657,
|
| 4 |
+
"<|box_end|>": 151649,
|
| 5 |
+
"<|box_start|>": 151648,
|
| 6 |
+
"<|endoftext|>": 151643,
|
| 7 |
+
"<|file_sep|>": 151664,
|
| 8 |
+
"<|fim_middle|>": 151660,
|
| 9 |
+
"<|fim_pad|>": 151662,
|
| 10 |
+
"<|fim_prefix|>": 151659,
|
| 11 |
+
"<|fim_suffix|>": 151661,
|
| 12 |
+
"<|im_end|>": 151645,
|
| 13 |
+
"<|im_start|>": 151644,
|
| 14 |
+
"<|image_pad|>": 151655,
|
| 15 |
+
"<|object_ref_end|>": 151647,
|
| 16 |
+
"<|object_ref_start|>": 151646,
|
| 17 |
+
"<|quad_end|>": 151651,
|
| 18 |
+
"<|quad_start|>": 151650,
|
| 19 |
+
"<|repo_name|>": 151663,
|
| 20 |
+
"<|video_pad|>": 151656,
|
| 21 |
+
"<|vision_end|>": 151653,
|
| 22 |
+
"<|vision_pad|>": 151654,
|
| 23 |
+
"<|vision_start|>": 151652
|
| 24 |
+
}
|
global_step_410/actor/huggingface/config.json
ADDED
|
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_attn_implementation_autoset": true,
|
| 3 |
+
"architectures": [
|
| 4 |
+
"Qwen2ForCausalLM"
|
| 5 |
+
],
|
| 6 |
+
"attention_dropout": 0.0,
|
| 7 |
+
"eos_token_id": 151643,
|
| 8 |
+
"hidden_act": "silu",
|
| 9 |
+
"hidden_size": 1536,
|
| 10 |
+
"initializer_range": 0.02,
|
| 11 |
+
"intermediate_size": 8960,
|
| 12 |
+
"max_position_embeddings": 4096,
|
| 13 |
+
"max_window_layers": 21,
|
| 14 |
+
"model_type": "qwen2",
|
| 15 |
+
"num_attention_heads": 12,
|
| 16 |
+
"num_hidden_layers": 28,
|
| 17 |
+
"num_key_value_heads": 2,
|
| 18 |
+
"pad_token_id": 151643,
|
| 19 |
+
"rms_norm_eps": 1e-06,
|
| 20 |
+
"rope_scaling": null,
|
| 21 |
+
"rope_theta": 10000,
|
| 22 |
+
"sliding_window": 4096,
|
| 23 |
+
"tie_word_embeddings": true,
|
| 24 |
+
"torch_dtype": "float32",
|
| 25 |
+
"transformers_version": "4.51.1",
|
| 26 |
+
"use_cache": true,
|
| 27 |
+
"use_mrope": false,
|
| 28 |
+
"use_sliding_window": false,
|
| 29 |
+
"vocab_size": 151936
|
| 30 |
+
}
|
global_step_410/actor/huggingface/generation_config.json
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token_id": 151643,
|
| 3 |
+
"eos_token_id": 151643,
|
| 4 |
+
"max_new_tokens": 2048,
|
| 5 |
+
"transformers_version": "4.51.1"
|
| 6 |
+
}
|
global_step_410/actor/huggingface/merges.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
global_step_410/actor/huggingface/special_tokens_map.json
ADDED
|
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"additional_special_tokens": [
|
| 3 |
+
"<|im_start|>",
|
| 4 |
+
"<|im_end|>",
|
| 5 |
+
"<|object_ref_start|>",
|
| 6 |
+
"<|object_ref_end|>",
|
| 7 |
+
"<|box_start|>",
|
| 8 |
+
"<|box_end|>",
|
| 9 |
+
"<|quad_start|>",
|
| 10 |
+
"<|quad_end|>",
|
| 11 |
+
"<|vision_start|>",
|
| 12 |
+
"<|vision_end|>",
|
| 13 |
+
"<|vision_pad|>",
|
| 14 |
+
"<|image_pad|>",
|
| 15 |
+
"<|video_pad|>"
|
| 16 |
+
],
|
| 17 |
+
"eos_token": {
|
| 18 |
+
"content": "<|endoftext|>",
|
| 19 |
+
"lstrip": false,
|
| 20 |
+
"normalized": false,
|
| 21 |
+
"rstrip": false,
|
| 22 |
+
"single_word": false
|
| 23 |
+
},
|
| 24 |
+
"pad_token": {
|
| 25 |
+
"content": "<|endoftext|>",
|
| 26 |
+
"lstrip": false,
|
| 27 |
+
"normalized": false,
|
| 28 |
+
"rstrip": false,
|
| 29 |
+
"single_word": false
|
| 30 |
+
}
|
| 31 |
+
}
|