Add files using upload-large-folder tool
Browse files- config.json +33 -0
- model-00001-of-00123.safetensors +3 -0
- model-00003-of-00123.safetensors +3 -0
- model-00005-of-00123.safetensors +3 -0
- model-00007-of-00123.safetensors +3 -0
- model-00008-of-00123.safetensors +3 -0
- model-00018-of-00123.safetensors +3 -0
- model-00019-of-00123.safetensors +3 -0
- model-00024-of-00123.safetensors +3 -0
- model-00026-of-00123.safetensors +3 -0
- model-00031-of-00123.safetensors +3 -0
- model-00035-of-00123.safetensors +3 -0
- model-00038-of-00123.safetensors +3 -0
- model-00039-of-00123.safetensors +3 -0
- model-00040-of-00123.safetensors +3 -0
- model-00042-of-00123.safetensors +3 -0
- model-00045-of-00123.safetensors +3 -0
- model-00050-of-00123.safetensors +3 -0
- model-00051-of-00123.safetensors +3 -0
- model-00052-of-00123.safetensors +3 -0
- model-00057-of-00123.safetensors +3 -0
- model-00061-of-00123.safetensors +3 -0
- model-00062-of-00123.safetensors +3 -0
- model-00068-of-00123.safetensors +3 -0
- model-00069-of-00123.safetensors +3 -0
- model-00080-of-00123.safetensors +3 -0
- model-00081-of-00123.safetensors +3 -0
- model-00084-of-00123.safetensors +3 -0
- model-00090-of-00123.safetensors +3 -0
- model-00092-of-00123.safetensors +3 -0
- model-00107-of-00123.safetensors +3 -0
- model-00111-of-00123.safetensors +3 -0
- model-00116-of-00123.safetensors +3 -0
- mtp/model.safetensors +3 -0
config.json
ADDED
|
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"Ernie4_5_MoeForCausalLM"
|
| 4 |
+
],
|
| 5 |
+
"bos_token_id": 1,
|
| 6 |
+
"eos_token_id": 2,
|
| 7 |
+
"dtype": "bfloat16",
|
| 8 |
+
"hidden_act": "silu",
|
| 9 |
+
"hidden_size": 8192,
|
| 10 |
+
"intermediate_size": 28672,
|
| 11 |
+
"max_position_embeddings": 131072,
|
| 12 |
+
"model_type": "ernie4_5_moe",
|
| 13 |
+
"num_attention_heads": 64,
|
| 14 |
+
"num_key_value_heads": 8,
|
| 15 |
+
"num_hidden_layers": 54,
|
| 16 |
+
"pad_token_id": 0,
|
| 17 |
+
"rms_norm_eps": 1e-05,
|
| 18 |
+
"use_cache": false,
|
| 19 |
+
"vocab_size": 103424,
|
| 20 |
+
"rope_theta": 500000,
|
| 21 |
+
"use_rmsnorm": true,
|
| 22 |
+
"use_bias": false,
|
| 23 |
+
"moe_num_experts": 64,
|
| 24 |
+
"moe_layer_start_index": 3,
|
| 25 |
+
"moe_intermediate_size": 3584,
|
| 26 |
+
"moe_capacity": [64,64,64],
|
| 27 |
+
"moe_gate": "topk",
|
| 28 |
+
"moe_k": 8,
|
| 29 |
+
"moe_layer_interval": 1,
|
| 30 |
+
"moe_use_aux_free": true,
|
| 31 |
+
"num_nextn_predict_layers": 1,
|
| 32 |
+
"tie_word_embeddings": false
|
| 33 |
+
}
|
model-00001-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:24117041d4e899e901c24e376c026a7e1666770f96a9850e201d83875462cce4
|
| 3 |
+
size 4949345664
|
model-00003-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:766fe2b2b4dac61ebf336612abb9754a45fa2934b3b6193f04c592c34bdd7528
|
| 3 |
+
size 4932508544
|
model-00005-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f2df69178510adb5528e60163f1705c3abed2019d4d39b2e42ab8cce3ab58990
|
| 3 |
+
size 4932508536
|
model-00007-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:343de0ba07414a9ded28b968aca7ba6c167f10291816108ce3eba087ef1cb0e5
|
| 3 |
+
size 4884307232
|
model-00008-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:97eb9e1a257acf472ce33897b8c0d1c30358961022c61652050e9db6bfa1e2ab
|
| 3 |
+
size 4932508544
|
model-00018-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:896eec3e53b61a5d25b658b6b999201be0889d56b790590b1dc2f50e45124e75
|
| 3 |
+
size 4884307248
|
model-00019-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0eb99e05db48ceacd66276edc2ed1154c2eef6f8b2e7142c94a8cbd8598b4743
|
| 3 |
+
size 4932508584
|
model-00024-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7cc26117312da6a27f55b9eac65380a3aa2c18776366980de252601c7352f386
|
| 3 |
+
size 4932508600
|
model-00026-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:558ca54119524a3b80e40c2ca69a9bb884537057148bf88565694b1facc4963b
|
| 3 |
+
size 4932508584
|
model-00031-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0a906d69dc07d4c35116a7e57d1d9cd9edba26f93fcb949e6662c20ab1144f26
|
| 3 |
+
size 4932508600
|
model-00035-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8695795c31fa945de452eec8fc31cc5665d02cb1bf599f3754baa30fd12ca8ef
|
| 3 |
+
size 4884307296
|
model-00038-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:45acf7b5a5a0dd062c22a9f8755e36659fbb1e69f697d3735867bd0532e41196
|
| 3 |
+
size 4932508592
|
model-00039-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a9bb8bd2dd471f45915e1a5f1b016293a666befbbf015422ed3bf5fc58d20c2d
|
| 3 |
+
size 4932508600
|
model-00040-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e301a82458d893dfc393c97b3ee4996b697419f579c3636999703f8b84c986af
|
| 3 |
+
size 4884307296
|
model-00042-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:470013eec6794347ea78efde0be1dc0ab7f35a0ea088ed48e2640ef930429b87
|
| 3 |
+
size 4884307296
|
model-00045-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cb8bf6d8ab6f7fbbda07cb6f3612d036ec47fe431e80231af9b7fb4674963a1d
|
| 3 |
+
size 4932508592
|
model-00050-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c2ba6d5ab2bb6b453b1655c9cd87a004100b6ba922153c42e4bf2a28822c5996
|
| 3 |
+
size 4932508600
|
model-00051-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5432e330c982641822eba79a19bd25be5c4c785126781d27a25d14ffbadbe221
|
| 3 |
+
size 4884307312
|
model-00052-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2d8a4e0a158ea6e7cfb2c1fe2790e3143f8a310abae920c6179d7e0975a703cc
|
| 3 |
+
size 4932508584
|
model-00057-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f83e852446dcd7a3d65c474d13bb31824c7b68dea5fbf57b04554ab04a9edeb5
|
| 3 |
+
size 4932508600
|
model-00061-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3c996d6b53895374ec0b2a3d0743727101e3287bcf3fc3adb9cf170a0cf35a7b
|
| 3 |
+
size 4884307296
|
model-00062-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3890b6fbad458d6cb8cd28c363cab7a6cebd721a71f65028d634eeeeaa4bb815
|
| 3 |
+
size 4932508600
|
model-00068-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:07d79686dcaf9b44bef253b9dedcd7b5867e92333f6680bc0f9c8fdc36cfacf7
|
| 3 |
+
size 4884307296
|
model-00069-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ccf0ac0683a0d160670d36a80d7cd279f676be505140888fef41f79038dda9e6
|
| 3 |
+
size 4932508600
|
model-00080-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0283a91ebc30ceb3449965ee6e89e7a77502c474835726367a1e4ad5d489894b
|
| 3 |
+
size 4884307296
|
model-00081-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1ac2bd46b28e7835096beb0a6c764820acbc256f4f3069e6cf305419c1bad248
|
| 3 |
+
size 4932508600
|
model-00084-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:39a5ce67ec4387349d6628897be31e3d135233cdaf57915a376c1434e74be469
|
| 3 |
+
size 4884307312
|
model-00090-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3b1a0283d1c84fd455673fcac2038c8c102ce1fa3462396db75384c00a371ddb
|
| 3 |
+
size 4932508600
|
model-00092-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c935e6c0c854c1bbc891212af5c05c2a199b1b35663a27b515e00b8b1e0b71d0
|
| 3 |
+
size 4932508584
|
model-00107-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:09a858807cc18806eaf1dd2bfb61d132b81dba23791c8ceb1877bc8b9ffb58a7
|
| 3 |
+
size 4932508600
|
model-00111-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5c922dcd716c1df309343ed0ce902cd3af0f5d99b8bd8e926ce51124f0f1ede8
|
| 3 |
+
size 4932508592
|
model-00116-of-00123.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bec23fb7f94cf9d87e6d013f19f75989a8361c0190f25bfab0b56d3f7cd81792
|
| 3 |
+
size 4932508600
|
mtp/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dec8ac44db50f728a5036bd3c66c439b48176e84eb729b2414125a4c0ec0f48b
|
| 3 |
+
size 1979778072
|