Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +5 -0
- global_step_10/data.pt +3 -0
- global_step_100/data.pt +3 -0
- global_step_110/data.pt +3 -0
- global_step_120/data.pt +3 -0
- global_step_130/data.pt +3 -0
- global_step_140/data.pt +3 -0
- global_step_150/data.pt +3 -0
- global_step_160/data.pt +3 -0
- global_step_170/data.pt +3 -0
- global_step_180/data.pt +3 -0
- global_step_190/data.pt +3 -0
- global_step_20/data.pt +3 -0
- global_step_200/data.pt +3 -0
- global_step_210/data.pt +3 -0
- global_step_220/data.pt +3 -0
- global_step_230/data.pt +3 -0
- global_step_240/data.pt +3 -0
- global_step_250/data.pt +3 -0
- global_step_260/data.pt +3 -0
- global_step_270/data.pt +3 -0
- global_step_280/data.pt +3 -0
- global_step_290/data.pt +3 -0
- global_step_30/data.pt +3 -0
- global_step_300/data.pt +3 -0
- global_step_310/data.pt +3 -0
- global_step_320/data.pt +3 -0
- global_step_330/data.pt +3 -0
- global_step_340/data.pt +3 -0
- global_step_350/data.pt +3 -0
- global_step_360/data.pt +3 -0
- global_step_370/data.pt +3 -0
- global_step_380/data.pt +3 -0
- global_step_390/data.pt +3 -0
- global_step_40/data.pt +3 -0
- global_step_400/data.pt +3 -0
- global_step_410/actor/extra_state_world_size_8_rank_0.pt +3 -0
- global_step_410/actor/extra_state_world_size_8_rank_1.pt +3 -0
- global_step_410/actor/extra_state_world_size_8_rank_2.pt +3 -0
- global_step_410/actor/extra_state_world_size_8_rank_3.pt +3 -0
- global_step_410/actor/extra_state_world_size_8_rank_4.pt +3 -0
- global_step_410/actor/extra_state_world_size_8_rank_5.pt +3 -0
- global_step_410/actor/extra_state_world_size_8_rank_6.pt +3 -0
- global_step_410/actor/extra_state_world_size_8_rank_7.pt +3 -0
- global_step_410/actor/fsdp_config.json +4 -0
- global_step_410/actor/huggingface/added_tokens.json +24 -0
- global_step_410/actor/huggingface/config.json +30 -0
- global_step_410/actor/huggingface/generation_config.json +6 -0
- global_step_410/actor/huggingface/merges.txt +0 -0
- global_step_410/actor/huggingface/special_tokens_map.json +31 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,8 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
global_step_410/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
global_step_420/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
global_step_430/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
global_step_440/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
global_step_444/actor/huggingface/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
global_step_10/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cf391c04dbda1311964af7b9c141d2afd529b83aff61fd4da85d656fa353638d
|
| 3 |
+
size 1492
|
global_step_100/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:30c6c5d1c47c52afc7e2d75e5af90844f161c5c5cbe2972ac1195ab576f999a6
|
| 3 |
+
size 1492
|
global_step_110/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:41b4e147b6d16906c9cfb2b39b9bdd4f75146f0a248ea0193454f81831e76bb4
|
| 3 |
+
size 1492
|
global_step_120/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e0923213f5bc69f840c724b48d54a96a74c280bf924321eda7a5367e1cf6b4e3
|
| 3 |
+
size 1492
|
global_step_130/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c5a2632e8a841943aac0f0be2b334f4646035c65d1240d66864082eef2d401a4
|
| 3 |
+
size 1492
|
global_step_140/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1d01484d6d09eccd8b9e3f43ded14211bbf555b505fc9cac08b24078ed9e27d0
|
| 3 |
+
size 1492
|
global_step_150/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:63d28b7ad26ac8173d552639da2317a6cdeb15cd3d165f9d3481a0836a0d50a8
|
| 3 |
+
size 1492
|
global_step_160/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:40c16c89c7e17c285a71307b956f303d8131868a85534719c6f3535051c6e513
|
| 3 |
+
size 1492
|
global_step_170/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9b1da1afdaf857aedda5156c314fb02caebf294c914408bdda5ebd8c265855ff
|
| 3 |
+
size 1492
|
global_step_180/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:32ff8a4eaf4da58e606e329c0fd94b6f1a4b0840ac231216d6bc44c380cd707d
|
| 3 |
+
size 1492
|
global_step_190/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c0bd9f2258a308c5ece66e363fc6484b3cb6826c672b3fd4acdc7b6e49f461ad
|
| 3 |
+
size 1492
|
global_step_20/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c25d7406469166649279d20b3414fe1ea78e6f46fbbf17d838f1d53ae281c6aa
|
| 3 |
+
size 1492
|
global_step_200/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:36e7177eca2e2ca560bec9dd93597e359cca2c17dd7b10906fc7f647179a150c
|
| 3 |
+
size 1492
|
global_step_210/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:780923f2542051db399881e3da91cff9e9573f4b199570e5fe6dfd6240777125
|
| 3 |
+
size 1492
|
global_step_220/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d711299389da17f156e270c7f7ed5fdf27008179afc08f6aa0889e57d7a12533
|
| 3 |
+
size 1492
|
global_step_230/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:99cfdaabc6cd3d66b52ca52068a4b697ee40389d4c4c50f10680be20f39ef14b
|
| 3 |
+
size 1492
|
global_step_240/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3cf9179c66cef966dc1af0bdbda417a06d6f5817de5ff1de64c931d725d39bf9
|
| 3 |
+
size 1492
|
global_step_250/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7564b3ab5f895159f11f932c2eee4872ef5c361e400837d40d864b5ad59a1028
|
| 3 |
+
size 1492
|
global_step_260/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bee533964194a4384efb4d7dc61934306240afce40624d1a59d988dd98d8b37c
|
| 3 |
+
size 1556
|
global_step_270/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0a1a40df593590b16688d2fefad7a4863df0ac714d07c46dd551beb3c3802a5a
|
| 3 |
+
size 1556
|
global_step_280/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9cb6bfadfbba33c6a3fe4d6d8f8f5c1571ec75a57aabf57492732350372cd5f8
|
| 3 |
+
size 1556
|
global_step_290/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a94eb0534e6d87e0c90357598ab7d49cea9bf589c4e55893fa90dc6210328ff
|
| 3 |
+
size 1556
|
global_step_30/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6ad84e82194e899d898db098bd3c3fd3168c3b6de92d20ded3f74c1b8f2c2d39
|
| 3 |
+
size 1492
|
global_step_300/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e2c789872541dd8f8118186a6553fc8a2c47d2254cf369285340ca4e125f27f8
|
| 3 |
+
size 1556
|
global_step_310/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:29b810c610fa09a3bc8ab4cbce64a6fa0a4ce49ce5e2b37d049368e9e7bde3f0
|
| 3 |
+
size 1556
|
global_step_320/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7604f66e6c2445b98f3eb98c87d3591f3a2d2716abf760aff727811bf24801fb
|
| 3 |
+
size 1556
|
global_step_330/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5be7f2e8ae24339c2d7f0dc5b70c98c64931ae00b1ea3e2939d024a8f327f8e3
|
| 3 |
+
size 1556
|
global_step_340/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0156a13255c7584e40fd403c638b91c7fde59e8bdb5a632d19cf15ee9c131e1e
|
| 3 |
+
size 1556
|
global_step_350/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4c559e9fd82fb38b02bc8f6293ad797b6862ebb53ef37ce152490f41516ed799
|
| 3 |
+
size 1556
|
global_step_360/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:14b003ce8c0a604d61456cd255b7ccfc4b2a914c53a3ffd77d3c65d902d63926
|
| 3 |
+
size 1556
|
global_step_370/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e903937cd25bf088396e3c5329a8a5181d1fb4da007aea7754ace4911c97dc4a
|
| 3 |
+
size 1556
|
global_step_380/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8043cee8945a3c94060974339e716f23bb5ff26320ed8e2bd4390dd42f8beae1
|
| 3 |
+
size 1556
|
global_step_390/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4c9d99e4d4cf579a06151a4a5ed5863330a0991c67ad46d354de963e83512af3
|
| 3 |
+
size 1556
|
global_step_40/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:628d93cadd40a5284c1e913ee41a8f47d1898d4f5fc4fc7ad6de5ec486a8c601
|
| 3 |
+
size 1492
|
global_step_400/data.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2052811d10bc639e35afc2a9c744ac5ecc26b4c303883b368274d1e20ab0fd2b
|
| 3 |
+
size 1556
|
global_step_410/actor/extra_state_world_size_8_rank_0.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:05b3ba55c9ab6f3006692a7c6183587902010dfd80b4ec0dde50c9a56f489b20
|
| 3 |
+
size 14632
|
global_step_410/actor/extra_state_world_size_8_rank_1.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:936d9887d3ff3688cc3a2ea9298b8ca0531f83b612463829b9dee248647925d6
|
| 3 |
+
size 14632
|
global_step_410/actor/extra_state_world_size_8_rank_2.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:408538fda8acacabcdec600c3b52d58f33fc116146fdfff08ad8dad398f2c7dc
|
| 3 |
+
size 14632
|
global_step_410/actor/extra_state_world_size_8_rank_3.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c2da863bf61902e45b320b63a58adebeda67a457be79b67057d0e53591ac9f89
|
| 3 |
+
size 14632
|
global_step_410/actor/extra_state_world_size_8_rank_4.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cecd819e59aee6a4a807036b2067ac751192cf69b917a5a598adb6c2bc67651b
|
| 3 |
+
size 14632
|
global_step_410/actor/extra_state_world_size_8_rank_5.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:97b4f0ec301ea549313d6f189a6078cc8e76af2155a10640ff7349f6710521f7
|
| 3 |
+
size 14632
|
global_step_410/actor/extra_state_world_size_8_rank_6.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:637234e33bd402a548e946634ebe04fd7f62954964ee7fe36933221d2fdab47c
|
| 3 |
+
size 14632
|
global_step_410/actor/extra_state_world_size_8_rank_7.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b18f4e1215deeeab897b1128842ca688e1bc80566906e3b5834f2445d60675f4
|
| 3 |
+
size 14632
|
global_step_410/actor/fsdp_config.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"FSDP_version": 1,
|
| 3 |
+
"world_size": 8
|
| 4 |
+
}
|
global_step_410/actor/huggingface/added_tokens.json
ADDED
|
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"</tool_call>": 151658,
|
| 3 |
+
"<tool_call>": 151657,
|
| 4 |
+
"<|box_end|>": 151649,
|
| 5 |
+
"<|box_start|>": 151648,
|
| 6 |
+
"<|endoftext|>": 151643,
|
| 7 |
+
"<|file_sep|>": 151664,
|
| 8 |
+
"<|fim_middle|>": 151660,
|
| 9 |
+
"<|fim_pad|>": 151662,
|
| 10 |
+
"<|fim_prefix|>": 151659,
|
| 11 |
+
"<|fim_suffix|>": 151661,
|
| 12 |
+
"<|im_end|>": 151645,
|
| 13 |
+
"<|im_start|>": 151644,
|
| 14 |
+
"<|image_pad|>": 151655,
|
| 15 |
+
"<|object_ref_end|>": 151647,
|
| 16 |
+
"<|object_ref_start|>": 151646,
|
| 17 |
+
"<|quad_end|>": 151651,
|
| 18 |
+
"<|quad_start|>": 151650,
|
| 19 |
+
"<|repo_name|>": 151663,
|
| 20 |
+
"<|video_pad|>": 151656,
|
| 21 |
+
"<|vision_end|>": 151653,
|
| 22 |
+
"<|vision_pad|>": 151654,
|
| 23 |
+
"<|vision_start|>": 151652
|
| 24 |
+
}
|
global_step_410/actor/huggingface/config.json
ADDED
|
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_attn_implementation_autoset": true,
|
| 3 |
+
"architectures": [
|
| 4 |
+
"Qwen2ForCausalLM"
|
| 5 |
+
],
|
| 6 |
+
"attention_dropout": 0.0,
|
| 7 |
+
"eos_token_id": 151643,
|
| 8 |
+
"hidden_act": "silu",
|
| 9 |
+
"hidden_size": 1536,
|
| 10 |
+
"initializer_range": 0.02,
|
| 11 |
+
"intermediate_size": 8960,
|
| 12 |
+
"max_position_embeddings": 4096,
|
| 13 |
+
"max_window_layers": 21,
|
| 14 |
+
"model_type": "qwen2",
|
| 15 |
+
"num_attention_heads": 12,
|
| 16 |
+
"num_hidden_layers": 28,
|
| 17 |
+
"num_key_value_heads": 2,
|
| 18 |
+
"pad_token_id": 151643,
|
| 19 |
+
"rms_norm_eps": 1e-06,
|
| 20 |
+
"rope_scaling": null,
|
| 21 |
+
"rope_theta": 10000,
|
| 22 |
+
"sliding_window": 4096,
|
| 23 |
+
"tie_word_embeddings": true,
|
| 24 |
+
"torch_dtype": "float32",
|
| 25 |
+
"transformers_version": "4.51.1",
|
| 26 |
+
"use_cache": true,
|
| 27 |
+
"use_mrope": false,
|
| 28 |
+
"use_sliding_window": false,
|
| 29 |
+
"vocab_size": 151936
|
| 30 |
+
}
|
global_step_410/actor/huggingface/generation_config.json
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token_id": 151643,
|
| 3 |
+
"eos_token_id": 151643,
|
| 4 |
+
"max_new_tokens": 2048,
|
| 5 |
+
"transformers_version": "4.51.1"
|
| 6 |
+
}
|
global_step_410/actor/huggingface/merges.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
global_step_410/actor/huggingface/special_tokens_map.json
ADDED
|
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"additional_special_tokens": [
|
| 3 |
+
"<|im_start|>",
|
| 4 |
+
"<|im_end|>",
|
| 5 |
+
"<|object_ref_start|>",
|
| 6 |
+
"<|object_ref_end|>",
|
| 7 |
+
"<|box_start|>",
|
| 8 |
+
"<|box_end|>",
|
| 9 |
+
"<|quad_start|>",
|
| 10 |
+
"<|quad_end|>",
|
| 11 |
+
"<|vision_start|>",
|
| 12 |
+
"<|vision_end|>",
|
| 13 |
+
"<|vision_pad|>",
|
| 14 |
+
"<|image_pad|>",
|
| 15 |
+
"<|video_pad|>"
|
| 16 |
+
],
|
| 17 |
+
"eos_token": {
|
| 18 |
+
"content": "<|endoftext|>",
|
| 19 |
+
"lstrip": false,
|
| 20 |
+
"normalized": false,
|
| 21 |
+
"rstrip": false,
|
| 22 |
+
"single_word": false
|
| 23 |
+
},
|
| 24 |
+
"pad_token": {
|
| 25 |
+
"content": "<|endoftext|>",
|
| 26 |
+
"lstrip": false,
|
| 27 |
+
"normalized": false,
|
| 28 |
+
"rstrip": false,
|
| 29 |
+
"single_word": false
|
| 30 |
+
}
|
| 31 |
+
}
|