riczhou committed on
Commit
3a1d6db
·
verified ·
1 Parent(s): 0b0fd75

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
mlc-chat-config.json ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "qwen3",
4
+ "quantization": "q0f16",
5
+ "model_config": {
6
+ "hidden_act": "silu",
7
+ "hidden_size": 4096,
8
+ "intermediate_size": 12288,
9
+ "attention_bias": false,
10
+ "num_attention_heads": 32,
11
+ "num_hidden_layers": 36,
12
+ "num_key_value_heads": 8,
13
+ "rms_norm_eps": 1e-06,
14
+ "rope_theta": 1000000,
15
+ "vocab_size": 151936,
16
+ "tie_word_embeddings": false,
17
+ "context_window_size": 40960,
18
+ "prefill_chunk_size": 2048,
19
+ "tensor_parallel_shards": 1,
20
+ "head_dim": 128,
21
+ "dtype": "float32",
22
+ "max_batch_size": 128
23
+ },
24
+ "vocab_size": 151936,
25
+ "context_window_size": 40960,
26
+ "sliding_window_size": -1,
27
+ "prefill_chunk_size": 2048,
28
+ "attention_sink_size": -1,
29
+ "tensor_parallel_shards": 1,
30
+ "pipeline_parallel_stages": 1,
31
+ "temperature": 0.6,
32
+ "presence_penalty": 0.0,
33
+ "frequency_penalty": 0.0,
34
+ "repetition_penalty": 1.0,
35
+ "top_p": 0.95,
36
+ "tokenizer_files": [
37
+ "tokenizer.json",
38
+ "vocab.json",
39
+ "merges.txt",
40
+ "tokenizer_config.json"
41
+ ],
42
+ "tokenizer_info": {
43
+ "token_postproc_method": "byte_level",
44
+ "prepend_space_in_encode": false,
45
+ "strip_space_in_decode": false
46
+ },
47
+ "conv_template": {
48
+ "name": "qwen2",
49
+ "system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
50
+ "system_message": "You are a helpful assistant.",
51
+ "system_prefix_token_ids": null,
52
+ "add_role_after_system_message": true,
53
+ "roles": {
54
+ "user": "<|im_start|>user",
55
+ "assistant": "<|im_start|>assistant"
56
+ },
57
+ "role_templates": {
58
+ "user": "{user_message}",
59
+ "assistant": "{assistant_message}",
60
+ "tool": "{tool_message}"
61
+ },
62
+ "messages": [],
63
+ "seps": [
64
+ "<|im_end|>\n"
65
+ ],
66
+ "role_content_sep": "\n",
67
+ "role_empty_sep": "\n",
68
+ "stop_str": [
69
+ "<|endoftext|>",
70
+ "<|im_end|>"
71
+ ],
72
+ "stop_token_ids": [
73
+ 151643,
74
+ 151645
75
+ ],
76
+ "function_string": "",
77
+ "use_function_calling": false
78
+ },
79
+ "pad_token_id": 151643,
80
+ "bos_token_id": 151643,
81
+ "eos_token_id": [
82
+ 151645,
83
+ 151643
84
+ ]
85
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15dee143bcc3de5655213ea9e40180d7332afda0dbc30601945740a296ef29bd
3
+ size 1244659712
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9323ec98d0d298e8c0168def3b8aa4b5d8dbe21405e180c81295d8cb3e76b4d2
3
+ size 1244659712
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8951cda41167c55c60dc0cbd07b8c8d55b9e847fc8d89226349f473dd0e8ae5
3
+ size 100663296
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9de76b31a2ec1856c6cba7de745abba7a1f1171d5de577a9e0825e79e4b9d8aa
3
+ size 50331648
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49e653c7b39575fce8b8171cd9dedbc9657f14dc2abbdbbe36213f0bc02de215
3
+ size 33554432
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bf52710a99f61df3ee9ae2097f819bf529997e6380933109f46d46de5aa59e2
3
+ size 100663296
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:308de56fd6e7bffd4429524b24ba73864d22e333fde7e36262cfe28bc2243e8a
3
+ size 201326592
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef1ccf01b2485d497912443f4029e6dd7a54d63ebceb43dbd8afc01710e6fb81
3
+ size 50331648
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f578ee440dd9e489b0f29e2e88b4bc8702cd5cead2d23dd7abec08a068ae3b6
3
+ size 33554432
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:147f2bed7e463977afdac96497531721afd6ff8afef8fedcf1f74c0c72f70989
3
+ size 100663296
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43b1424c369f740eb4634d45317e0ccd548da9a03a5912d3fb93c6bdc2a6e8f9
3
+ size 201326592
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46143f4fc0bf674a519d981c61cb5d8bd38e17d2dbd333f86ff68c057554a585
3
+ size 50331648
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9db23ebb5bb2ff243094d6cafe8ca791610f6fcab620c92601c6f8ac481b7a6
3
+ size 33554432
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:914ebe292bcae5188c5d39ea7a97f37d7b800be972ee6d05fe94c772ec64a037
3
+ size 201326592
params_shard_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f218c656dcddd7f7a30fc70ad0965dcf7d46a48ca46a0a69a82ccc05588cb9d
3
+ size 201326592
params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9b617cd0d34b244d89a7a6961ba43ff8b878453d8d33efc2a5d32a876b8c547
3
+ size 50331648
params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae72c534432352532825fe8367e8b3138a898b11ee5aaa80e44b0201b4630f0f
3
+ size 33554432
params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd9ce8a0cb116caef3de2ed668f30ce571f338480971f5050df5b7e7431be501
3
+ size 100663296
params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:548b74ae7c143b977afff82230e8576d62b524ed48763872d81c543a59a55f73
3
+ size 100663296
params_shard_115.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82d0274dd3b2783a6e7cc496e5ee950b9558ab60543285c2549d6b0c9b289bf4
3
+ size 201326592
params_shard_116.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e39595f86d080ac1bb614a52d799ef86da586029470f922816b30f949d2e3f7
3
+ size 50331648
params_shard_117.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab6132aebe56001d6d95088c4ca889f5d2d1c29a51bf6bd130f888873fefb92a
3
+ size 33554432
params_shard_118.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f1354e04c7410b512f422c2d61d3ea58197258a210155b5529e21c2d60d9535
3
+ size 100663296
params_shard_119.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd420b108f83a240f46b03f1142cc5b86ce7e8c9a12ed7353beab29838b1d914
3
+ size 201326592
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:311afd2dd65bb0383d84c9ced7d0e01675b9da63d1b094c7292b00f5ebbd654d
3
+ size 50331648
params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42a7140faa8ed2af18c60f11f2fc7bf737cc23c61660029172068adab4b1dbed
3
+ size 50331648
params_shard_121.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c07aa1340c9a742938dcc230838e78dd1369f86952f9de28854a0caa484055d8
3
+ size 33554432
params_shard_122.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07af13ce2b9f51556a6c088c984d57f9e822afb601d1633025f48ed0ba9021d1
3
+ size 100663296
params_shard_123.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cb49c183b07e688b72788ee82f236501f278f18d75bef13b9b07a6b120043ce
3
+ size 201326592
params_shard_124.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3ee659ee66bd1b1db116a51f75567d961e4338d6be9e41cf6ea93e567924656
3
+ size 50331648
params_shard_125.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93ac4073acf4b2d85fa3733f2d7d2563264576e288b07b9d3bbb881c782c4499
3
+ size 33554432
params_shard_126.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c61ee45413706a0ed1873c19b06905e4ada766cf2951c160bcec4ac6ec32bb0
3
+ size 100663296
params_shard_127.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a99e914b43b86f1d2d9c5515d30c73d944595e3e4a796937e9b4e793eb201ad2
3
+ size 201326592
params_shard_128.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14be5751fdfb421d262654a5dc4b54427cba5a34078f43342bfd6c61cb61cbad
3
+ size 50331648
params_shard_129.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2828a7cc6d58171d7178a53c64e4db0d77c519935e48c0d5c26aeaf9555348c0
3
+ size 33554432
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56082bec02e69ea92106e45032c4deec40479b0a7fdf6f6d6d813f25c843f55b
3
+ size 33554432
params_shard_130.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c05f2d082a03d0112890eb475130225a2b990f381d90671cb45d58350abd1429
3
+ size 100663296
params_shard_131.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:426082766d670f0219bf3d75b9227a25d77a9e56d4d7e8c097c4c91e473152a5
3
+ size 201326592
params_shard_132.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01e7a796f45599697fa9b2f101fbbf75d03a100cd890823c760fccae299013c6
3
+ size 50331648
params_shard_133.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa1f53ab02f786865e83d2fd6c3471829845366e3600df7773f5d563ad4781f3
3
+ size 33554432
params_shard_134.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6de97dea4893c775084985de90226ac139f731ca2e22fb5a16be718545f4b9a9
3
+ size 100663296
params_shard_135.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0530f32c9fc1cce671bc599eaecbc1677fa960e9e04613f4a5b4829264f035ac
3
+ size 201326592
params_shard_136.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d346d3a234b51664650d20654fde36495696dab3cda12c95cf48a4ac781fd0c
3
+ size 50331648
params_shard_137.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:246e64a042c1362114c8ad603868fb4c8cd357784dba66f3c4f6432f236d7298
3
+ size 33554432
params_shard_138.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df6d1f1238154f699937fff5e341f5b4e4dba8711fccd56e57242afa4b513bf7
3
+ size 100663296
params_shard_139.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:146c9139f46c1413a6bb26ada9cf86d86ed5cc484b62008001c2eb235fba57d4
3
+ size 201326592