riczhou committed on
Commit
58af6b1
·
verified ·
1 Parent(s): 87e8b1c

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
mlc-chat-config.json ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "qwen3",
4
+ "quantization": "q4f32_1",
5
+ "model_config": {
6
+ "hidden_act": "silu",
7
+ "hidden_size": 5120,
8
+ "intermediate_size": 25600,
9
+ "attention_bias": false,
10
+ "num_attention_heads": 64,
11
+ "num_hidden_layers": 64,
12
+ "num_key_value_heads": 8,
13
+ "rms_norm_eps": 1e-06,
14
+ "rope_theta": 1000000,
15
+ "vocab_size": 151936,
16
+ "tie_word_embeddings": false,
17
+ "context_window_size": 40960,
18
+ "prefill_chunk_size": 2048,
19
+ "tensor_parallel_shards": 1,
20
+ "head_dim": 128,
21
+ "dtype": "float32",
22
+ "max_batch_size": 128
23
+ },
24
+ "vocab_size": 151936,
25
+ "context_window_size": 40960,
26
+ "sliding_window_size": -1,
27
+ "prefill_chunk_size": 2048,
28
+ "attention_sink_size": -1,
29
+ "tensor_parallel_shards": 1,
30
+ "pipeline_parallel_stages": 1,
31
+ "temperature": 0.6,
32
+ "presence_penalty": 0.0,
33
+ "frequency_penalty": 0.0,
34
+ "repetition_penalty": 1.0,
35
+ "top_p": 0.95,
36
+ "tokenizer_files": [
37
+ "tokenizer.json",
38
+ "vocab.json",
39
+ "merges.txt",
40
+ "tokenizer_config.json"
41
+ ],
42
+ "tokenizer_info": {
43
+ "token_postproc_method": "byte_level",
44
+ "prepend_space_in_encode": false,
45
+ "strip_space_in_decode": false
46
+ },
47
+ "conv_template": {
48
+ "name": "qwen2",
49
+ "system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
50
+ "system_message": "You are a helpful assistant.",
51
+ "system_prefix_token_ids": null,
52
+ "add_role_after_system_message": true,
53
+ "roles": {
54
+ "user": "<|im_start|>user",
55
+ "assistant": "<|im_start|>assistant"
56
+ },
57
+ "role_templates": {
58
+ "user": "{user_message}",
59
+ "assistant": "{assistant_message}",
60
+ "tool": "{tool_message}"
61
+ },
62
+ "messages": [],
63
+ "seps": [
64
+ "<|im_end|>\n"
65
+ ],
66
+ "role_content_sep": "\n",
67
+ "role_empty_sep": "\n",
68
+ "stop_str": [
69
+ "<|endoftext|>",
70
+ "<|im_end|>"
71
+ ],
72
+ "stop_token_ids": [
73
+ 151643,
74
+ 151645
75
+ ],
76
+ "function_string": "",
77
+ "use_function_calling": false
78
+ },
79
+ "pad_token_id": 151643,
80
+ "bos_token_id": 151643,
81
+ "eos_token_id": [
82
+ 151645,
83
+ 151643
84
+ ]
85
+ }
ndarray-cache-b16.json ADDED
The diff for this file is too large to render. See raw diff
 
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de9c1b38202e2b2dce44a5174c75e802d325fd67012370a2f5d74ef56faad3e2
3
+ size 388956160
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c1d3818d9ccd0aa766da1aa31a6621fb322a8dcfe1675656b882bcbf4cf5b96
3
+ size 48619520
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94b4ca9032884ba7543f9dc30a441945b8031f4edb570fcd3ecbde2ee9bef18e
3
+ size 48619520
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bc63765d8beaeb99d3c4e512dba8cd6b9d84aee038e91baa7f94247d20eb7ca
3
+ size 131072000
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4214fe95b1be90af70a9d26537510bcfa014c142f8c7e32523c48d2de8bf636
3
+ size 26214400
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:480c60b6582667ea5b542544deac1e5bd18688945474e732a69dfb9c40211a6f
3
+ size 20971520
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0249121a8799b12607efe64df45da67f4346d6fae214f8f4911d589a951af0db
3
+ size 131072000
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d047044bb8852b3603609510057bbc2111181d8a3f041ebf557c0fe7bf136c5
3
+ size 30484992
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1680bc1b1f8a0362fdf6a63e93d3260b6b23f7401e3bd7c602abad0c81d88258
3
+ size 26214400
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ef3accb593e47d27a8a27dd433c21b46e81c09328729aa8fff7166bab47cc53
3
+ size 20971520
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:824314c02feb13b41cb6b01d18e034bb3bd03f7e6319fae291a426b4cc310e05
3
+ size 65536000
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1895389f43c933f6ba0c3c5d9dd2db597b19a611e933f905842b9369452d8e8
3
+ size 65536000
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77c5db225b3d78b43a9f0be7e9149182410dbe93598cfc83c536e9b164d6da1e
3
+ size 30505472
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d83a5092f69e51bb6c33d1f0976c567cffe3accd1443e8526dd8fc7b112cea82
3
+ size 65536000
params_shard_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1ab6222d240fbc14c34e9dc14c3372d0e45a237386290e49b198abd53ed5c5f
3
+ size 131072000
params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ab6a61b39dbe43d0ac7d3eea29bf132a4b606ee4d5968d086e73c411b63f0e0
3
+ size 26214400
params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2509b70b6cd216753aaba10a1a9ca1f638a318f0c7de1b4ee77424c44fc837e6
3
+ size 20971520
params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f646d7ffd163f919d14ac3ac01795d9671398700d335dccdc8e35673fa2ff9b
3
+ size 65536000
params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:206b8ec2f55d1c34d695d0b2f9872242f5a453e9aa4a19981c0ae47c23fc9bf4
3
+ size 30495232
params_shard_115.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aff3ea0d74f28cf00e2f5c3b8a01d655f2f5125ab80ded1e880df8d8c4820ca8
3
+ size 131072000
params_shard_116.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8ec53142450fc1b72bdda2f3f2f8418c5fbcf78c4a13242acbb5a01b909e9fa
3
+ size 26214400
params_shard_117.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2021e52dbb074221b30780adc6c0de3103c4047ea20822dfb146ecd1f42c8d6c
3
+ size 20971520
params_shard_118.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44b98bd90cc1ebb502aed1dbfaa643436eb89128c1f4eeaedb54406787247b8e
3
+ size 65536000
params_shard_119.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33e1c6920cb5fcb221127a60edf61ad988632e3ff8d38232df1c25d9cdf1b3d4
3
+ size 30495232
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a91a7f350d1d2f46c9667766d3f1b3da04c106ceaa62d4cbed1ef0b27b79bed5
3
+ size 131072000
params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4bbdfcddea30d4cdd2b49b0276aa1d8e7972a663e0d1d5759f62ab41964c5ad5
3
+ size 131072000
params_shard_121.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a10fbc7ecdd1f89b2257bb9f1b9e4287c48cd357d5f92caafc74bb4a67bd73f5
3
+ size 26214400
params_shard_122.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1adc46c9ca2735834ec9c564c0913b9c8cc10125f326524b22e105e8cd22801
3
+ size 20971520
params_shard_123.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fb042ac5a428d911bf69920c1cdb789ffc3ec7b451b18dae5c2f581170d8022
3
+ size 26214400
params_shard_124.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb3b11cd69b6d031b444a54ad05ded84127463b11f445e215e6a7ff2fe9f6cb5
3
+ size 30485248
params_shard_125.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5eede4b2db99ad5afcb7f7432aeac869d127a4add75a5b2c6bdbad288712074b
3
+ size 65536000
params_shard_126.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:913e295a30ac7a7a715c9a22b07bf25660b32c7a03f66eb0554949f563a63255
3
+ size 26880256
params_shard_127.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67e183dbb55c9f33fef062640561741efee68bd6b9d9261a9a7b2bec0b5485c9
3
+ size 65536000
params_shard_128.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f79f5f2f6994eb0869d20eb17b515bab2f6668a39c96b73d0f23ec71f3f5116d
3
+ size 131072000
params_shard_129.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e997351f19f3a162f99d421aabe9ac8bf97dde04331dadad18cb269ce34caff8
3
+ size 26214400
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab29825519c2ad39def125bd467a4b6eb966143adf0b6982f9b8f4a3f493b20c
3
+ size 30505472
params_shard_130.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd942867ec168461cffa22470eb4e80a56700e2e78c70c84c3dd84ac5f74b99b
3
+ size 32798976
params_shard_131.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73cae19bcc11610ea5084c7cbe29ba97d896b11d18fa5f9b303705727d0b53f0
3
+ size 65536000
params_shard_132.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b9071b1861cab1ba888da08efe711065940e91d1ec4a79d2d78a004970ce267
3
+ size 26880256
params_shard_133.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b9ef8d0d5c21659536542feac25c714a0ccbd4abf272b64763d64ee52b6431c
3
+ size 131072000
params_shard_134.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f4b9091f4fc7a71e8fde9dbcef5bf704f6e9a1778cd58cb619a64e52de535d4
3
+ size 26214400
params_shard_135.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a1a4a3afc0a964aa35fc4b826738662f75c1deff3ae28f624b5948a4c763fbd
3
+ size 20971520
params_shard_136.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22f56d2ab61f9f138eee34ce70f0cd7d1e05ba410391ad1edc197cf2e34cf834
3
+ size 65536000
params_shard_137.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bca1158889b353bdb36062f05a130547ef55bc69307c24ee464d4cff2fbf699
3
+ size 30495232
params_shard_138.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aef2ded280d40e0a392133efe113ad32bc192d21bd1561e67c7c71b4fc119302
3
+ size 131072000