Add files using upload-large-folder tool
Browse files
- LICENSE +21 -0
- config.json +66 -0
- generation_config.json +9 -0
- model-00095-of-000163.safetensors +3 -0
- model-00096-of-000163.safetensors +3 -0
- model-00097-of-000163.safetensors +3 -0
- model-00098-of-000163.safetensors +3 -0
- model-00099-of-000163.safetensors +3 -0
- model-00101-of-000163.safetensors +3 -0
- model-00102-of-000163.safetensors +3 -0
- model-00103-of-000163.safetensors +3 -0
- model-00104-of-000163.safetensors +3 -0
- model-00105-of-000163.safetensors +3 -0
- model-00106-of-000163.safetensors +3 -0
- model-00107-of-000163.safetensors +3 -0
- model-00108-of-000163.safetensors +3 -0
- model-00109-of-000163.safetensors +3 -0
- model-00110-of-000163.safetensors +3 -0
- model-00111-of-000163.safetensors +3 -0
- model-00112-of-000163.safetensors +3 -0
- model-00113-of-000163.safetensors +3 -0
- model-00114-of-000163.safetensors +3 -0
- model-00115-of-000163.safetensors +3 -0
- model-00116-of-000163.safetensors +3 -0
- model-00117-of-000163.safetensors +3 -0
- model-00118-of-000163.safetensors +3 -0
- model-00119-of-000163.safetensors +3 -0
- model-00120-of-000163.safetensors +3 -0
- model-00122-of-000163.safetensors +3 -0
- model-00146-of-000163.safetensors +3 -0
- model-00147-of-000163.safetensors +3 -0
- model-00148-of-000163.safetensors +3 -0
- model-00149-of-000163.safetensors +3 -0
- model-00150-of-000163.safetensors +3 -0
- model-00151-of-000163.safetensors +3 -0
- model-00152-of-000163.safetensors +3 -0
- model-00153-of-000163.safetensors +3 -0
- model-00154-of-000163.safetensors +3 -0
- model-00155-of-000163.safetensors +3 -0
- model-00156-of-000163.safetensors +3 -0
- model-00157-of-000163.safetensors +3 -0
- model-00158-of-000163.safetensors +3 -0
- model-00159-of-000163.safetensors +3 -0
- model-00160-of-000163.safetensors +3 -0
- model-00161-of-000163.safetensors +3 -0
- model-00162-of-000163.safetensors +3 -0
- model-00163-of-000163.safetensors +3 -0
- model.safetensors.index.json +0 -0
- tokenizer.json +0 -0
- tokenizer_config.json +35 -0
LICENSE
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
MIT License
|
| 2 |
+
|
| 3 |
+
Copyright (c) 2023 DeepSeek
|
| 4 |
+
|
| 5 |
+
Permission is hereby granted, free of charge, to any person obtaining a copy
|
| 6 |
+
of this software and associated documentation files (the "Software"), to deal
|
| 7 |
+
in the Software without restriction, including without limitation the rights
|
| 8 |
+
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
| 9 |
+
copies of the Software, and to permit persons to whom the Software is
|
| 10 |
+
furnished to do so, subject to the following conditions:
|
| 11 |
+
|
| 12 |
+
The above copyright notice and this permission notice shall be included in all
|
| 13 |
+
copies or substantial portions of the Software.
|
| 14 |
+
|
| 15 |
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
| 16 |
+
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
| 17 |
+
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
| 18 |
+
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
| 19 |
+
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
| 20 |
+
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
| 21 |
+
SOFTWARE.
|
config.json
ADDED
|
@@ -0,0 +1,66 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"DeepseekV32ForCausalLM"
|
| 4 |
+
],
|
| 5 |
+
"attention_bias": false,
|
| 6 |
+
"attention_dropout": 0.0,
|
| 7 |
+
"bos_token_id": 0,
|
| 8 |
+
"eos_token_id": 1,
|
| 9 |
+
"ep_size": 1,
|
| 10 |
+
"first_k_dense_replace": 3,
|
| 11 |
+
"hidden_act": "silu",
|
| 12 |
+
"hidden_size": 7168,
|
| 13 |
+
"index_head_dim": 128,
|
| 14 |
+
"index_n_heads": 64,
|
| 15 |
+
"index_topk": 2048,
|
| 16 |
+
"initializer_range": 0.02,
|
| 17 |
+
"intermediate_size": 18432,
|
| 18 |
+
"kv_lora_rank": 512,
|
| 19 |
+
"max_position_embeddings": 163840,
|
| 20 |
+
"model_type": "deepseek_v32",
|
| 21 |
+
"moe_intermediate_size": 2048,
|
| 22 |
+
"moe_layer_freq": 1,
|
| 23 |
+
"n_group": 8,
|
| 24 |
+
"n_routed_experts": 256,
|
| 25 |
+
"n_shared_experts": 1,
|
| 26 |
+
"norm_topk_prob": true,
|
| 27 |
+
"num_attention_heads": 128,
|
| 28 |
+
"num_experts_per_tok": 8,
|
| 29 |
+
"num_hidden_layers": 61,
|
| 30 |
+
"num_key_value_heads": 128,
|
| 31 |
+
"num_nextn_predict_layers": 1,
|
| 32 |
+
"q_lora_rank": 1536,
|
| 33 |
+
"qk_nope_head_dim": 128,
|
| 34 |
+
"qk_rope_head_dim": 64,
|
| 35 |
+
"quantization_config": {
|
| 36 |
+
"activation_scheme": "dynamic",
|
| 37 |
+
"fmt": "e4m3",
|
| 38 |
+
"quant_method": "fp8",
|
| 39 |
+
"scale_fmt": "ue8m0",
|
| 40 |
+
"weight_block_size": [
|
| 41 |
+
128,
|
| 42 |
+
128
|
| 43 |
+
]
|
| 44 |
+
},
|
| 45 |
+
"rms_norm_eps": 1e-06,
|
| 46 |
+
"rope_scaling": {
|
| 47 |
+
"beta_fast": 32,
|
| 48 |
+
"beta_slow": 1,
|
| 49 |
+
"factor": 40,
|
| 50 |
+
"mscale": 1.0,
|
| 51 |
+
"mscale_all_dim": 1.0,
|
| 52 |
+
"original_max_position_embeddings": 4096,
|
| 53 |
+
"type": "yarn"
|
| 54 |
+
},
|
| 55 |
+
"rope_theta": 10000,
|
| 56 |
+
"routed_scaling_factor": 2.5,
|
| 57 |
+
"scoring_func": "sigmoid",
|
| 58 |
+
"tie_word_embeddings": false,
|
| 59 |
+
"topk_group": 4,
|
| 60 |
+
"topk_method": "noaux_tc",
|
| 61 |
+
"torch_dtype": "bfloat16",
|
| 62 |
+
"transformers_version": "4.44.2",
|
| 63 |
+
"use_cache": true,
|
| 64 |
+
"v_head_dim": 128,
|
| 65 |
+
"vocab_size": 129280
|
| 66 |
+
}
|
generation_config.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_from_model_config": true,
|
| 3 |
+
"bos_token_id": 0,
|
| 4 |
+
"eos_token_id": 1,
|
| 5 |
+
"do_sample": true,
|
| 6 |
+
"temperature": 0.6,
|
| 7 |
+
"top_p": 0.95,
|
| 8 |
+
"transformers_version": "4.46.3"
|
| 9 |
+
}
|
model-00095-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a37ee841ceb5d6da6b3ea603ea533512bba44db380be644ad37faeb3af231d85
|
| 3 |
+
size 4302122420
|
model-00096-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2b75e03171a1ea8a44c25ffbb6abaeb1e473763426dce746c03dba1d031a7c57
|
| 3 |
+
size 4302384870
|
model-00097-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:80cf1a489771466e336d2306321cde173454f0ab67f7341653df8268968a1fed
|
| 3 |
+
size 4302122808
|
model-00098-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:01c6a93a211061641df5949379a2eb38beff7c7285f2900ce119d6d42b55bcbf
|
| 3 |
+
size 4302384470
|
model-00099-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f6ff76f49c885bc2d076783178c69f357b5d7c8b5d2d1f1e9b30e06aefbf1806
|
| 3 |
+
size 4302384963
|
model-00101-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8a038df3227b3b88baeb35f1a2814e8fc22bcda04235a63526ddf1162da8c8d5
|
| 3 |
+
size 4302061105
|
model-00102-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:df033187bb10076a2eb32273af0eb5a89eedd7c65db2ae64449830bdc55312b2
|
| 3 |
+
size 4302384914
|
model-00103-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d1c4cb7b3a81e8fa3b46c5f9cba2a97b769f4c82c2005610c21a04b4b6e9362d
|
| 3 |
+
size 4302122764
|
model-00104-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:039416f75c5f9b01ea7706a4578c10b36d2bd65d0ae647551b42d3ee09419022
|
| 3 |
+
size 4302384516
|
model-00105-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5ea44f0fc9a60890ef49541a96cde1351e9867c97978be60dd24bbc8649c90ab
|
| 3 |
+
size 4302384961
|
model-00106-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9085297b817cabca6d30f2002772258952778469eccce0c3053bed548843f94b
|
| 3 |
+
size 4302122576
|
model-00107-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f0a80d0cf72d7eb6f9002786885706d6f9a565449deae8d682bde813fd801972
|
| 3 |
+
size 4302384704
|
model-00108-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:33a2bfbe5e40e513f5f98e66e85318adc54348a4656aee8b300f8972fedd814d
|
| 3 |
+
size 4302384963
|
model-00109-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c045b68d8767915b8ca516304fecb1d2ff713cd30b20a73926c120523504a4ab
|
| 3 |
+
size 4302122398
|
model-00110-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a611de6a11d5ca9eab967d49212acc26e77f63846a904bdd1a3178119359cbf
|
| 3 |
+
size 4302384890
|
model-00111-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:41b8aaf89940143283be411080e7129d8556d52189a257a28e3cc97b0b130b3b
|
| 3 |
+
size 4302122786
|
model-00112-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ea85fa7d9437dc9ea529b89b96f9078ca3662e8abd659efb91266f7fde59436c
|
| 3 |
+
size 4302384494
|
model-00113-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:99dac612f57573d63ade18771b23caec5912ca067d8ae830f0f3e3d6c4e6b698
|
| 3 |
+
size 4302384963
|
model-00114-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cf4263cf035ff57647c11c988026a48043dc88323c734fd51a10368ec18f9848
|
| 3 |
+
size 4302122598
|
model-00115-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:65a149f38c6f3daeb302ceee54ce3664255b5822a0dd40ed5c6a62d70ea2d388
|
| 3 |
+
size 4302384680
|
model-00116-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fd260bd3f39e5aa90609819cff07263c91ad0a2f4f1cb4a57f94cbacdf4d007d
|
| 3 |
+
size 4302384963
|
model-00117-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9dadc62b182fd6577697bd89544c6c0097ac5b46f059a6730ec0b0fc98fa7242
|
| 3 |
+
size 4302122420
|
model-00118-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d711b22702f5fd27074a82ba298296bf6127b860b18a2024435be99fc0986fde
|
| 3 |
+
size 4302384870
|
model-00119-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1fcd13b9fe958ac6d8865434b58aaadb3fb8d61ca1bbd8ee9ecc98334135eb70
|
| 3 |
+
size 4302122808
|
model-00120-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aa8033ac21b053077e018e47b88a6e63d86c1019e3e6e716309ef9c1b85c14eb
|
| 3 |
+
size 4302384470
|
model-00122-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fc62e20e8e31cd829802f1dee0a13e84ac63518c7f2d2d5ce219a174df15d0c8
|
| 3 |
+
size 1864917414
|
model-00146-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6ef1d3a9e8a1af51ea191bf0f502fb9638258e44efdfed8c28741bbe0716110c
|
| 3 |
+
size 4302384961
|
model-00147-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:88bda448fb7c45780da91e4b74c718996b54f298f6e0f43d3b53304ee6db00f6
|
| 3 |
+
size 4302122576
|
model-00148-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:79b30b82b563eb7ef8329f90c878bfa6d89023150e9dfa5c5e32ac431bb0665b
|
| 3 |
+
size 4302384704
|
model-00149-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a8dbc89f8dfabccecb73daddd84ed2968e377b83ebb29de222be798031446102
|
| 3 |
+
size 4302384963
|
model-00150-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:55ca5774581611d741ffb9a3a92f543b5e766afeaf2634a7d1d8056fb659cc1e
|
| 3 |
+
size 4302122398
|
model-00151-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:28e8610d6ffed36dab61e4af0e43910c23c222084ce3f0fd64b404ad4ba36f4b
|
| 3 |
+
size 4302384890
|
model-00152-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:209a5b7b4ee8e072de03c406ea02aa9ea4c4aaa6d35fc9d9345e37cc2549c389
|
| 3 |
+
size 4302122786
|
model-00153-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b3a04c397f5a1d9d0a5c9f8e3121af617cf462534e622e6b58da1d2134d635a9
|
| 3 |
+
size 4302384494
|
model-00154-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2f4155c347885f1d194ee43833698a896aef646a675f5ed1844b4741af271821
|
| 3 |
+
size 4302384963
|
model-00155-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3b7f90c03cc6687ddff6a0786d4da532ee38a1cd3cb98bcaee5bbbc57a1714e1
|
| 3 |
+
size 4302122598
|
model-00156-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d0cdb458d5dc78b86486c0d98ba1ffc8b2d10d13828cfb70943327639f9bc5c
|
| 3 |
+
size 4302384680
|
model-00157-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fd31688d8aab534cad1b43db98f6502ef16c14a7886da8e0af003e2ab1ed9446
|
| 3 |
+
size 4302384963
|
model-00158-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:08b9b3ba78cbb5ff5e2179ca8e5e6c459b1f3d5d2efaecc73e416683d4b85b4e
|
| 3 |
+
size 4302122420
|
model-00159-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b65fe157aa870201b61de28efdeafd4550e10db3e88bf051dafe2bfcf9bac04f
|
| 3 |
+
size 4302384870
|
model-00160-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:44cda07c16fccd2218f7e4098e3b9ba46b9c1830673471a32a9a63fca9d90a74
|
| 3 |
+
size 5285723731
|
model-00161-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b477f7be8270a7ac94f568c1bc1c70d23b08ecc3bc96f1fc97f87522d5721bc6
|
| 3 |
+
size 4305819875
|
model-00162-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a62a72aae31a7d743379cc80d0d5877709ea3683326ef690184a2b4bc128f5f5
|
| 3 |
+
size 4302384938
|
model-00163-of-000163.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3dc1e3cd27e10f2533fe8c0f01fd71bd1dc81e999b913eb15405e42b18c295ef
|
| 3 |
+
size 6643591758
|
model.safetensors.index.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer_config.json
ADDED
|
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"add_bos_token": true,
|
| 3 |
+
"add_eos_token": false,
|
| 4 |
+
"bos_token": {
|
| 5 |
+
"__type": "AddedToken",
|
| 6 |
+
"content": "<|begin▁of▁sentence|>",
|
| 7 |
+
"lstrip": false,
|
| 8 |
+
"normalized": true,
|
| 9 |
+
"rstrip": false,
|
| 10 |
+
"single_word": false
|
| 11 |
+
},
|
| 12 |
+
"clean_up_tokenization_spaces": false,
|
| 13 |
+
"eos_token": {
|
| 14 |
+
"__type": "AddedToken",
|
| 15 |
+
"content": "<|end▁of▁sentence|>",
|
| 16 |
+
"lstrip": false,
|
| 17 |
+
"normalized": true,
|
| 18 |
+
"rstrip": false,
|
| 19 |
+
"single_word": false
|
| 20 |
+
},
|
| 21 |
+
"legacy": true,
|
| 22 |
+
"model_max_length": 131072,
|
| 23 |
+
"pad_token": {
|
| 24 |
+
"__type": "AddedToken",
|
| 25 |
+
"content": "<|end▁of▁sentence|>",
|
| 26 |
+
"lstrip": false,
|
| 27 |
+
"normalized": true,
|
| 28 |
+
"rstrip": false,
|
| 29 |
+
"single_word": false
|
| 30 |
+
},
|
| 31 |
+
"sp_model_kwargs": {},
|
| 32 |
+
"unk_token": null,
|
| 33 |
+
"tokenizer_class": "LlamaTokenizerFast",
|
| 34 |
+
"chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% if not thinking is defined %}{% set thinking = false %}{% endif %}{% set ns = namespace(is_first=false, is_tool=false, system_prompt='', is_first_sp=true, is_last_user=false, is_only_sys=false, is_prefix=false) %}{%- for message in messages %}{%- if message['role'] == 'system' %}{%- if ns.is_first_sp %}{% set ns.system_prompt = ns.system_prompt + message['content'] %}{% set ns.is_first_sp = false %}{%- else %}{% set ns.system_prompt = ns.system_prompt + '\n\n' + message['content'] %}{%- endif %}{% set ns.is_only_sys = true %}{%- endif %}{%- endfor %}{{ bos_token }}{{ ns.system_prompt }}{%- for message in messages %}{%- if message['role'] == 'user' %}{%- set ns.is_tool = false -%}{%- set ns.is_first = false -%}{%- set ns.is_last_user = true -%}{{'<|User|>' + message['content']}}{%- endif %}{%- if message['role'] == 'assistant' and message['tool_calls'] is defined and message['tool_calls'] is not none %}{%- if ns.is_last_user or ns.is_only_sys %}{{'<|Assistant|></think>'}}{%- endif %}{%- set ns.is_last_user = false -%}{%- set ns.is_first = false %}{%- set ns.is_tool = false -%}{%- for tool in message['tool_calls'] %}{%- if not ns.is_first %}{%- if message['content'] is none %}{{'<|tool▁calls▁begin|><|tool▁call▁begin|>'+ tool['function']['name'] + '<|tool▁sep|>' + tool['function']['arguments'] + '<|tool▁call▁end|>'}}{%- else %}{{message['content'] + '<|tool▁calls▁begin|><|tool▁call▁begin|>' + tool['function']['name'] + '<|tool▁sep|>' + tool['function']['arguments'] + '<|tool▁call▁end|>'}}{%- endif %}{%- set ns.is_first = true -%}{%- else %}{{'<|tool▁call▁begin|>'+ tool['function']['name'] + '<|tool▁sep|>' + tool['function']['arguments'] + '<|tool▁call▁end|>'}}{%- endif %}{%- endfor %}{{'<|tool▁calls▁end|><|end▁of▁sentence|>'}}{%- endif %}{%- if message['role'] == 'assistant' and (message['tool_calls'] is not defined or message['tool_calls'] is none) %}{%- if ns.is_last_user %}{{'<|Assistant|>'}}{%- if message['prefix'] is defined and message['prefix'] and thinking %}{{'<think>'}}{%- else %}{{'</think>'}}{%- endif %}{%- endif %}{%- if message['prefix'] is defined and message['prefix'] %}{%- set ns.is_prefix = true -%}{%- endif %}{%- set ns.is_last_user = false -%}{%- if ns.is_tool %}{{message['content'] + '<|end▁of▁sentence|>'}}{%- set ns.is_tool = false -%}{%- else %}{%- set content = message['content'] -%}{%- if '</think>' in content %}{%- set content = content.split('</think>', 1)[1] -%}{%- endif %}{{content + '<|end▁of▁sentence|>'}}{%- endif %}{%- endif %}{%- if message['role'] == 'tool' %}{%- set ns.is_last_user = false -%}{%- set ns.is_tool = true -%}{{'<|tool▁output▁begin|>' + message['content'] + '<|tool▁output▁end|>'}}{%- endif %}{%- if message['role'] != 'system' %}{% set ns.is_only_sys = false %}{%- endif %}{%- endfor -%}{% if add_generation_prompt and not ns.is_tool%}{% if ns.is_last_user or ns.is_only_sys or not ns.is_prefix %}{{'<|Assistant|>'}}{%- if not thinking %}{{'</think>'}}{%- else %}{{'<think>'}}{%- endif %}{% endif %}{% endif %}"
|
| 35 |
+
}
|