riczhou committed on
Commit
b2f5abb
·
verified ·
1 Parent(s): fd2aa0b

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
mlc-chat-config.json ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "qwen3",
4
+ "quantization": "q0f16",
5
+ "model_config": {
6
+ "hidden_act": "silu",
7
+ "hidden_size": 5120,
8
+ "intermediate_size": 17408,
9
+ "attention_bias": false,
10
+ "num_attention_heads": 40,
11
+ "num_hidden_layers": 40,
12
+ "num_key_value_heads": 8,
13
+ "rms_norm_eps": 1e-06,
14
+ "rope_theta": 1000000,
15
+ "vocab_size": 151936,
16
+ "tie_word_embeddings": false,
17
+ "context_window_size": 40960,
18
+ "prefill_chunk_size": 2048,
19
+ "tensor_parallel_shards": 1,
20
+ "head_dim": 128,
21
+ "dtype": "float32",
22
+ "max_batch_size": 128
23
+ },
24
+ "vocab_size": 151936,
25
+ "context_window_size": 40960,
26
+ "sliding_window_size": -1,
27
+ "prefill_chunk_size": 2048,
28
+ "attention_sink_size": -1,
29
+ "tensor_parallel_shards": 1,
30
+ "pipeline_parallel_stages": 1,
31
+ "temperature": 0.6,
32
+ "presence_penalty": 0.0,
33
+ "frequency_penalty": 0.0,
34
+ "repetition_penalty": 1.0,
35
+ "top_p": 0.95,
36
+ "tokenizer_files": [
37
+ "tokenizer.json",
38
+ "vocab.json",
39
+ "merges.txt",
40
+ "tokenizer_config.json"
41
+ ],
42
+ "tokenizer_info": {
43
+ "token_postproc_method": "byte_level",
44
+ "prepend_space_in_encode": false,
45
+ "strip_space_in_decode": false
46
+ },
47
+ "conv_template": {
48
+ "name": "qwen2",
49
+ "system_template": "<|im_start|>system\n{system_message}<|im_end|>\n",
50
+ "system_message": "You are a helpful assistant.",
51
+ "system_prefix_token_ids": null,
52
+ "add_role_after_system_message": true,
53
+ "roles": {
54
+ "user": "<|im_start|>user",
55
+ "assistant": "<|im_start|>assistant"
56
+ },
57
+ "role_templates": {
58
+ "user": "{user_message}",
59
+ "assistant": "{assistant_message}",
60
+ "tool": "{tool_message}"
61
+ },
62
+ "messages": [],
63
+ "seps": [
64
+ "<|im_end|>\n"
65
+ ],
66
+ "role_content_sep": "\n",
67
+ "role_empty_sep": "\n",
68
+ "stop_str": [
69
+ "<|endoftext|>",
70
+ "<|im_end|>"
71
+ ],
72
+ "stop_token_ids": [
73
+ 151643,
74
+ 151645
75
+ ],
76
+ "function_string": "",
77
+ "use_function_calling": false
78
+ },
79
+ "pad_token_id": 151643,
80
+ "bos_token_id": 151643,
81
+ "eos_token_id": [
82
+ 151645,
83
+ 151643
84
+ ]
85
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab6de60fc7247485a3a773f487ef7566d30319d2e472c495fe57c9597bca66bb
3
+ size 1555824640
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f58b6a45b3069af53839f86b673e75c962781ea9ce548d8bc9a8b5cd9cc46178
3
+ size 178257920
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eceb515ace3348557fc66f9bbab1830b99cb94d6aa2cc163551cadb880b9e6c6
3
+ size 73400320
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3983f296bd0b301d1a01c3d3d2e896ecc9392617075c536dbc2fe282152e5311
3
+ size 52428800
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d7546eb7280c8c0600fd162446defd35a32cd8f299469d0f82070c92e590922
3
+ size 178257920
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d6bd04975f5b1c1995316fde123a054a8fb52c73000e41860c7a853cabafbc7
3
+ size 356515840
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e07622879eebca62760a66722aeb884b04b03115e1856a1772334342f09eb553
3
+ size 73400320
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0eddbb569eba793e5cabbd5cf07e965a66ad3fdef8bff488ae24c995d2f19c43
3
+ size 52428800
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6f5fffa7ec6ef4c527f81076dfe898427c07e4faa8e558cb8fdf8e92dc9a6e2
3
+ size 178257920
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e451e33f6496806fde11ba85149bb7c9d3eecb112051212a7f40cb360717fb3
3
+ size 356515840
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:061ee4d6f0dd002d6732bfa70bf39ccf81ae644fa9707424275f659b04d47fed
3
+ size 73400320
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59eef84352e5dfd4230283aa0c877b8666347cbc4fe62839416e3cf63b9e0632
3
+ size 52428800
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:737cc12647d0f07be94d1e7dce3f8177036848586490d27aa21fc315a2b4b084
3
+ size 178257920
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbd7256e4d0b694afc27d6dc15a6adbc6b380817e1d9342174e408c6d86607f1
3
+ size 52428800
params_shard_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f16a6de4ab268cce7ae734f0739e5c1482584a6c654d1f206b3509bc463fddf
3
+ size 356515840
params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d090926d2d19d655e5f7e1372ac7b976878559954f1a10d1171239572ff48ec
3
+ size 73400320
params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aaa1ac1c27788ef633a37b1681bd5b6c3420127f8b140b8dc12201e90ad1aab6
3
+ size 52428800
params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82c4277ec8dc2b0c52810ea0c68fe1c75d92cff81770a79b1a3264f7d6bd1388
3
+ size 356515840
params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b73c4ae12bf01b682b442bf4dbe08955983caad2e7fc5fbcf61305b6d248778d
3
+ size 73400320
params_shard_115.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03c9116303044a9a701c73bc8ed86cffbb0043246c10b0856c37f705d604772c
3
+ size 52428800
params_shard_116.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c065471e7c8566310cf0d87cdd61c07e1d3389e33f4ad47509f024b9b9907517
3
+ size 178257920
params_shard_117.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a9e918df481446f0011136adddfa7cec0dd9fb89cb6a27970cceb36da17b097
3
+ size 178257920
params_shard_118.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ada8000987abb06a0019ca0708d0fe35453311a0d9aebee8b1c29b23a3685678
3
+ size 356515840
params_shard_119.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a990cc7c46e887350cb0e825a728a94b2bd4c81ccdad06e0160a17f86c481a51
3
+ size 73400320
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e98f56213cd5ce12bd135bf09beba2e2ece8b216f2a23f7856d21396889a539a
3
+ size 178257920
params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02d7b4061499a27dc9a7b196f820b7d702bbb41055e597a90fc7e438b2070a50
3
+ size 52428800
params_shard_121.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5511ba85aa57f0375e740695e6585c25d8b43580937f5c0a8426fd52dcf01fc
3
+ size 178257920
params_shard_122.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b0c0e634e84ee725647e85fe1aed6871270b48a0fad77114a9f5167de562bea
3
+ size 356515840
params_shard_123.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff7ecd796142dbcd4b25bda309d7d91937bb99f7d0aaec29ca4a1e70cf4cedb6
3
+ size 73400320
params_shard_124.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:943c965dffa4c736e05330d616098de2e890b19e164665c50cb8216493d1b9c5
3
+ size 52428800
params_shard_125.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff4ae654241c739f3e48c2efa9b6af6d7930e9631bc2586ac8b03ff417ad98ac
3
+ size 178257920
params_shard_126.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d83747a75c2aec69aa71d6b6cc4dd1e7d35496667675353171eec8f548375d2
3
+ size 356515840
params_shard_127.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03dc54329ce70243dc3a5f589bfc02f83ba7465dbf91d281751f0cb60847bf21
3
+ size 73400320
params_shard_128.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:629278f9a9ca7d139cb1a5112899b6ed58ced0544e566d4e06d5c3205c9d4faa
3
+ size 52428800
params_shard_129.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91c74c500cfe717d4086aacf2805f635c9005188902d593ef6903937f04c4a82
3
+ size 178257920
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5e833fca99896497ce6409507f27128ace274f375daa063105ddc3b946d36e0
3
+ size 356515840
params_shard_130.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcd6e7f94edc6b6b9670dc39e39631ec948c4c6f3c8e70714e1fb5c79923be60
3
+ size 356515840
params_shard_131.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4e11dba5c2dc508557f0433bf665181958cdf47a674f813be43faaaf55bb296
3
+ size 73400320
params_shard_132.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be8c3298084fdd46a4b9b174227a1f119517dada88b0dfa70d070c7decb98900
3
+ size 52428800
params_shard_133.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7036e419cc0980a6afb04c6305405d988fbbfc18eac96ed0db5a93bc62c3908b
3
+ size 178257920
params_shard_134.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9104e5771cda5e1515f5bf7d453954e60f702b3111184f11c92d1e7c6b72fac
3
+ size 356515840
params_shard_135.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aef71228ae67e12391b0e7832e8d78ca30f14b4afb68a4e6879be5e39e2eab9c
3
+ size 73400320
params_shard_136.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73d16393066100539ffae1eead6e29e409758dd600148a2200723032f826c095
3
+ size 52428800
params_shard_137.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9be6e9150fde5bcf0eabaea3dde13ca537ce42fbc5f655279de7635188ee34b3
3
+ size 73400320
params_shard_138.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:724d267c3bd72509e1b06af4e85986d1e930cdc4c08b4d69517c9dcb92a836d3
3
+ size 52428800
params_shard_139.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8d319e2d76a8f3f9985e8aab987f35c6a50b8cfc659f0e83f6c19dc0d98c145
3
+ size 178257920