hk311 committed on
Commit
c170ab0
·
verified ·
1 Parent(s): 514468a

Add files using upload-large-folder tool

Browse files
config.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Ernie4_5_MoeForCausalLM"
4
+ ],
5
+ "bos_token_id": 1,
6
+ "eos_token_id": 2,
7
+ "dtype": "bfloat16",
8
+ "hidden_act": "silu",
9
+ "hidden_size": 8192,
10
+ "intermediate_size": 28672,
11
+ "max_position_embeddings": 131072,
12
+ "model_type": "ernie4_5_moe",
13
+ "num_attention_heads": 64,
14
+ "num_key_value_heads": 8,
15
+ "num_hidden_layers": 54,
16
+ "pad_token_id": 0,
17
+ "rms_norm_eps": 1e-05,
18
+ "use_cache": false,
19
+ "vocab_size": 103424,
20
+ "rope_theta": 500000,
21
+ "use_rmsnorm": true,
22
+ "use_bias": false,
23
+ "moe_num_experts": 64,
24
+ "moe_layer_start_index": 3,
25
+ "moe_intermediate_size": 3584,
26
+ "moe_capacity": [64,64,64],
27
+ "moe_gate": "topk",
28
+ "moe_k": 8,
29
+ "moe_layer_interval": 1,
30
+ "moe_use_aux_free": true,
31
+ "num_nextn_predict_layers": 1,
32
+ "tie_word_embeddings": false
33
+ }
model-00001-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24117041d4e899e901c24e376c026a7e1666770f96a9850e201d83875462cce4
3
+ size 4949345664
model-00003-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:766fe2b2b4dac61ebf336612abb9754a45fa2934b3b6193f04c592c34bdd7528
3
+ size 4932508544
model-00005-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2df69178510adb5528e60163f1705c3abed2019d4d39b2e42ab8cce3ab58990
3
+ size 4932508536
model-00007-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:343de0ba07414a9ded28b968aca7ba6c167f10291816108ce3eba087ef1cb0e5
3
+ size 4884307232
model-00008-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97eb9e1a257acf472ce33897b8c0d1c30358961022c61652050e9db6bfa1e2ab
3
+ size 4932508544
model-00018-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:896eec3e53b61a5d25b658b6b999201be0889d56b790590b1dc2f50e45124e75
3
+ size 4884307248
model-00019-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0eb99e05db48ceacd66276edc2ed1154c2eef6f8b2e7142c94a8cbd8598b4743
3
+ size 4932508584
model-00024-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7cc26117312da6a27f55b9eac65380a3aa2c18776366980de252601c7352f386
3
+ size 4932508600
model-00026-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:558ca54119524a3b80e40c2ca69a9bb884537057148bf88565694b1facc4963b
3
+ size 4932508584
model-00031-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a906d69dc07d4c35116a7e57d1d9cd9edba26f93fcb949e6662c20ab1144f26
3
+ size 4932508600
model-00035-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8695795c31fa945de452eec8fc31cc5665d02cb1bf599f3754baa30fd12ca8ef
3
+ size 4884307296
model-00038-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45acf7b5a5a0dd062c22a9f8755e36659fbb1e69f697d3735867bd0532e41196
3
+ size 4932508592
model-00039-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9bb8bd2dd471f45915e1a5f1b016293a666befbbf015422ed3bf5fc58d20c2d
3
+ size 4932508600
model-00040-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e301a82458d893dfc393c97b3ee4996b697419f579c3636999703f8b84c986af
3
+ size 4884307296
model-00042-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:470013eec6794347ea78efde0be1dc0ab7f35a0ea088ed48e2640ef930429b87
3
+ size 4884307296
model-00045-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb8bf6d8ab6f7fbbda07cb6f3612d036ec47fe431e80231af9b7fb4674963a1d
3
+ size 4932508592
model-00050-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2ba6d5ab2bb6b453b1655c9cd87a004100b6ba922153c42e4bf2a28822c5996
3
+ size 4932508600
model-00051-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5432e330c982641822eba79a19bd25be5c4c785126781d27a25d14ffbadbe221
3
+ size 4884307312
model-00052-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d8a4e0a158ea6e7cfb2c1fe2790e3143f8a310abae920c6179d7e0975a703cc
3
+ size 4932508584
model-00057-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f83e852446dcd7a3d65c474d13bb31824c7b68dea5fbf57b04554ab04a9edeb5
3
+ size 4932508600
model-00061-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c996d6b53895374ec0b2a3d0743727101e3287bcf3fc3adb9cf170a0cf35a7b
3
+ size 4884307296
model-00062-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3890b6fbad458d6cb8cd28c363cab7a6cebd721a71f65028d634eeeeaa4bb815
3
+ size 4932508600
model-00068-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07d79686dcaf9b44bef253b9dedcd7b5867e92333f6680bc0f9c8fdc36cfacf7
3
+ size 4884307296
model-00069-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccf0ac0683a0d160670d36a80d7cd279f676be505140888fef41f79038dda9e6
3
+ size 4932508600
model-00080-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0283a91ebc30ceb3449965ee6e89e7a77502c474835726367a1e4ad5d489894b
3
+ size 4884307296
model-00081-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ac2bd46b28e7835096beb0a6c764820acbc256f4f3069e6cf305419c1bad248
3
+ size 4932508600
model-00084-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39a5ce67ec4387349d6628897be31e3d135233cdaf57915a376c1434e74be469
3
+ size 4884307312
model-00090-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b1a0283d1c84fd455673fcac2038c8c102ce1fa3462396db75384c00a371ddb
3
+ size 4932508600
model-00092-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c935e6c0c854c1bbc891212af5c05c2a199b1b35663a27b515e00b8b1e0b71d0
3
+ size 4932508584
model-00107-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09a858807cc18806eaf1dd2bfb61d132b81dba23791c8ceb1877bc8b9ffb58a7
3
+ size 4932508600
model-00111-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c922dcd716c1df309343ed0ce902cd3af0f5d99b8bd8e926ce51124f0f1ede8
3
+ size 4932508592
model-00116-of-00123.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bec23fb7f94cf9d87e6d013f19f75989a8361c0190f25bfab0b56d3f7cd81792
3
+ size 4932508600
mtp/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dec8ac44db50f728a5036bd3c66c439b48176e84eb729b2414125a4c0ec0f48b
3
+ size 1979778072