re-upload using new tokenizer
Browse files
- config.json +2 -2
- generation_config.json +1 -1
- model-00001-of-00002.safetensors +1 -1
- tokenizer.json +7 -6
- tokenizer_config.json +6 -6
config.json
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
{
|
| 2 |
-
"_name_or_path": "/home/ubuntu/.cache/huggingface/hub/models--NousResearch--Hermes-2-Pro-Llama-3-8B/snapshots/
|
| 3 |
"architectures": [
|
| 4 |
"LlamaForCausalLM"
|
| 5 |
],
|
|
@@ -30,7 +30,7 @@
|
|
| 30 |
"rope_theta": 500000.0,
|
| 31 |
"tie_word_embeddings": false,
|
| 32 |
"torch_dtype": "float16",
|
| 33 |
-
"transformers_version": "4.
|
| 34 |
"use_cache": false,
|
| 35 |
"vocab_size": 128288
|
| 36 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"_name_or_path": "/home/ubuntu/.cache/huggingface/hub/models--NousResearch--Hermes-2-Pro-Llama-3-8B/snapshots/7c94b9e1248071b53e8b303893a51feb811dcc2c",
|
| 3 |
"architectures": [
|
| 4 |
"LlamaForCausalLM"
|
| 5 |
],
|
|
|
|
| 30 |
"rope_theta": 500000.0,
|
| 31 |
"tie_word_embeddings": false,
|
| 32 |
"torch_dtype": "float16",
|
| 33 |
+
"transformers_version": "4.40.1",
|
| 34 |
"use_cache": false,
|
| 35 |
"vocab_size": 128288
|
| 36 |
}
|
generation_config.json
CHANGED
|
@@ -3,5 +3,5 @@
|
|
| 3 |
"bos_token_id": 128000,
|
| 4 |
"do_sample": true,
|
| 5 |
"eos_token_id": 128003,
|
| 6 |
-
"transformers_version": "4.
|
| 7 |
}
|
|
|
|
| 3 |
"bos_token_id": 128000,
|
| 4 |
"do_sample": true,
|
| 5 |
"eos_token_id": 128003,
|
| 6 |
+
"transformers_version": "4.40.1"
|
| 7 |
}
|
model-00001-of-00002.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4677527440
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b9f440c275e5870e69dae71d1d4e72de52d14f35ff5ebcc16fe09f7b6cdecda6
|
| 3 |
size 4677527440
|
tokenizer.json
CHANGED
|
@@ -46,7 +46,7 @@
|
|
| 46 |
"lstrip": false,
|
| 47 |
"rstrip": false,
|
| 48 |
"normalized": false,
|
| 49 |
-
"special": true
|
| 50 |
},
|
| 51 |
{
|
| 52 |
"id": 128005,
|
|
@@ -55,7 +55,7 @@
|
|
| 55 |
"lstrip": false,
|
| 56 |
"rstrip": false,
|
| 57 |
"normalized": false,
|
| 58 |
-
"special": true
|
| 59 |
},
|
| 60 |
{
|
| 61 |
"id": 128006,
|
|
@@ -82,7 +82,7 @@
|
|
| 82 |
"lstrip": false,
|
| 83 |
"rstrip": false,
|
| 84 |
"normalized": false,
|
| 85 |
-
"special": true
|
| 86 |
},
|
| 87 |
{
|
| 88 |
"id": 128009,
|
|
@@ -100,7 +100,7 @@
|
|
| 100 |
"lstrip": false,
|
| 101 |
"rstrip": false,
|
| 102 |
"normalized": false,
|
| 103 |
-
"special": true
|
| 104 |
},
|
| 105 |
{
|
| 106 |
"id": 128011,
|
|
@@ -109,7 +109,7 @@
|
|
| 109 |
"lstrip": false,
|
| 110 |
"rstrip": false,
|
| 111 |
"normalized": false,
|
| 112 |
-
"special": true
|
| 113 |
},
|
| 114 |
{
|
| 115 |
"id": 128012,
|
|
@@ -118,7 +118,7 @@
|
|
| 118 |
"lstrip": false,
|
| 119 |
"rstrip": false,
|
| 120 |
"normalized": false,
|
| 121 |
-
"special": true
|
| 122 |
},
|
| 123 |
{
|
| 124 |
"id": 128013,
|
|
@@ -2695,6 +2695,7 @@
|
|
| 2695 |
"end_of_word_suffix": null,
|
| 2696 |
"fuse_unk": false,
|
| 2697 |
"byte_fallback": false,
|
|
|
|
| 2698 |
"vocab": {
|
| 2699 |
"!": 0,
|
| 2700 |
"\"": 1,
|
|
|
|
| 46 |
"lstrip": false,
|
| 47 |
"rstrip": false,
|
| 48 |
"normalized": false,
|
| 49 |
+
"special": false
|
| 50 |
},
|
| 51 |
{
|
| 52 |
"id": 128005,
|
|
|
|
| 55 |
"lstrip": false,
|
| 56 |
"rstrip": false,
|
| 57 |
"normalized": false,
|
| 58 |
+
"special": false
|
| 59 |
},
|
| 60 |
{
|
| 61 |
"id": 128006,
|
|
|
|
| 82 |
"lstrip": false,
|
| 83 |
"rstrip": false,
|
| 84 |
"normalized": false,
|
| 85 |
+
"special": false
|
| 86 |
},
|
| 87 |
{
|
| 88 |
"id": 128009,
|
|
|
|
| 100 |
"lstrip": false,
|
| 101 |
"rstrip": false,
|
| 102 |
"normalized": false,
|
| 103 |
+
"special": false
|
| 104 |
},
|
| 105 |
{
|
| 106 |
"id": 128011,
|
|
|
|
| 109 |
"lstrip": false,
|
| 110 |
"rstrip": false,
|
| 111 |
"normalized": false,
|
| 112 |
+
"special": false
|
| 113 |
},
|
| 114 |
{
|
| 115 |
"id": 128012,
|
|
|
|
| 118 |
"lstrip": false,
|
| 119 |
"rstrip": false,
|
| 120 |
"normalized": false,
|
| 121 |
+
"special": false
|
| 122 |
},
|
| 123 |
{
|
| 124 |
"id": 128013,
|
|
|
|
| 2695 |
"end_of_word_suffix": null,
|
| 2696 |
"fuse_unk": false,
|
| 2697 |
"byte_fallback": false,
|
| 2698 |
+
"ignore_merges": true,
|
| 2699 |
"vocab": {
|
| 2700 |
"!": 0,
|
| 2701 |
"\"": 1,
|
tokenizer_config.json
CHANGED
|
@@ -38,7 +38,7 @@
|
|
| 38 |
"normalized": false,
|
| 39 |
"rstrip": false,
|
| 40 |
"single_word": false,
|
| 41 |
-
"special": true
|
| 42 |
},
|
| 43 |
"128005": {
|
| 44 |
"content": "<tool_response>",
|
|
@@ -46,7 +46,7 @@
|
|
| 46 |
"normalized": false,
|
| 47 |
"rstrip": false,
|
| 48 |
"single_word": false,
|
| 49 |
-
"special": true
|
| 50 |
},
|
| 51 |
"128006": {
|
| 52 |
"content": "<|start_header_id|>",
|
|
@@ -70,7 +70,7 @@
|
|
| 70 |
"normalized": false,
|
| 71 |
"rstrip": false,
|
| 72 |
"single_word": false,
|
| 73 |
-
"special": true
|
| 74 |
},
|
| 75 |
"128009": {
|
| 76 |
"content": "<|eot_id|>",
|
|
@@ -86,7 +86,7 @@
|
|
| 86 |
"normalized": false,
|
| 87 |
"rstrip": false,
|
| 88 |
"single_word": false,
|
| 89 |
-
"special": true
|
| 90 |
},
|
| 91 |
"128011": {
|
| 92 |
"content": "</tool_call>",
|
|
@@ -94,7 +94,7 @@
|
|
| 94 |
"normalized": false,
|
| 95 |
"rstrip": false,
|
| 96 |
"single_word": false,
|
| 97 |
-
"special": true
|
| 98 |
},
|
| 99 |
"128012": {
|
| 100 |
"content": "</tool_response>",
|
|
@@ -102,7 +102,7 @@
|
|
| 102 |
"normalized": false,
|
| 103 |
"rstrip": false,
|
| 104 |
"single_word": false,
|
| 105 |
-
"special": true
|
| 106 |
},
|
| 107 |
"128013": {
|
| 108 |
"content": "<|reserved_special_token_8|>",
|
|
|
|
| 38 |
"normalized": false,
|
| 39 |
"rstrip": false,
|
| 40 |
"single_word": false,
|
| 41 |
+
"special": false
|
| 42 |
},
|
| 43 |
"128005": {
|
| 44 |
"content": "<tool_response>",
|
|
|
|
| 46 |
"normalized": false,
|
| 47 |
"rstrip": false,
|
| 48 |
"single_word": false,
|
| 49 |
+
"special": false
|
| 50 |
},
|
| 51 |
"128006": {
|
| 52 |
"content": "<|start_header_id|>",
|
|
|
|
| 70 |
"normalized": false,
|
| 71 |
"rstrip": false,
|
| 72 |
"single_word": false,
|
| 73 |
+
"special": false
|
| 74 |
},
|
| 75 |
"128009": {
|
| 76 |
"content": "<|eot_id|>",
|
|
|
|
| 86 |
"normalized": false,
|
| 87 |
"rstrip": false,
|
| 88 |
"single_word": false,
|
| 89 |
+
"special": false
|
| 90 |
},
|
| 91 |
"128011": {
|
| 92 |
"content": "</tool_call>",
|
|
|
|
| 94 |
"normalized": false,
|
| 95 |
"rstrip": false,
|
| 96 |
"single_word": false,
|
| 97 |
+
"special": false
|
| 98 |
},
|
| 99 |
"128012": {
|
| 100 |
"content": "</tool_response>",
|
|
|
|
| 102 |
"normalized": false,
|
| 103 |
"rstrip": false,
|
| 104 |
"single_word": false,
|
| 105 |
+
"special": false
|
| 106 |
},
|
| 107 |
"128013": {
|
| 108 |
"content": "<|reserved_special_token_8|>",
|