JackBinary committed on
Commit
adfc334
·
verified ·
1 Parent(s): b97e672

Add files using upload-large-folder tool

Browse files
README.md ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: mlc-llm
3
+ base_model: knifeayumu/Cydonia-v1.3-Magnum-v4-22B
4
+ tags:
5
+ - mlc-llm
6
+ - web-llm
7
+ ---
8
+
9
+ # Cydonia-v1.3-Magnum-v4-22B-q4f16_1-MLC
10
+
11
+ This is the [Cydonia-v1.3-Magnum-v4-22B](https://huggingface.co/knifeayumu/Cydonia-v1.3-Magnum-v4-22B) model in MLC format `q4f16_1`.
12
+ The model can be used with [MLC-LLM](https://github.com/mlc-ai/mlc-llm) and [WebLLM](https://github.com/mlc-ai/web-llm).
13
+
14
+ ## Example Usage
15
+
16
+ Before using the examples, please follow the [installation guide](https://llm.mlc.ai/docs/install/mlc_llm.html#install-mlc-packages).
17
+
18
+ ### Chat CLI
19
+
20
+ ```bash
21
+ mlc_llm chat HF://JackBinary/Cydonia-v1.3-Magnum-v4-22B-q4f16_1-MLC
22
+ ```
23
+
24
+ ### REST Server
25
+
26
+ ```bash
27
+ mlc_llm serve HF://JackBinary/Cydonia-v1.3-Magnum-v4-22B-q4f16_1-MLC
28
+ ```
29
+
30
+ ### Python API
31
+
32
+ ```python
33
+ from mlc_llm import MLCEngine
34
+
35
+ model = "HF://JackBinary/Cydonia-v1.3-Magnum-v4-22B-q4f16_1-MLC"
36
+ engine = MLCEngine(model)
37
+
38
+ for response in engine.chat.completions.create(
39
+     messages=[{"role": "user", "content": "What is the meaning of life?"}],
40
+     model=model,
41
+     stream=True,
42
+ ):
43
+     for choice in response.choices:
44
+         print(choice.delta.content, end="", flush=True)
45
+ print("\n")
46
+
47
+ engine.terminate()
48
+ ```
49
+
50
+ ## Documentation
51
+
52
+ For more on MLC LLM, visit the [documentation](https://llm.mlc.ai/docs/) and [GitHub repo](https://github.com/mlc-ai/mlc-llm).
mlc-chat-config.json ADDED
@@ -0,0 +1,80 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "mistral",
4
+ "quantization": "q4f16_1",
5
+ "model_config": {
6
+ "hidden_size": 6144,
7
+ "intermediate_size": 16384,
8
+ "num_attention_heads": 48,
9
+ "num_hidden_layers": 56,
10
+ "rms_norm_eps": 1e-05,
11
+ "vocab_size": 32768,
12
+ "position_embedding_base": 1000000.0,
13
+ "num_key_value_heads": 8,
14
+ "head_dim": 128,
15
+ "context_window_size": 32768,
16
+ "sliding_window_size": -1,
17
+ "prefill_chunk_size": 8192,
18
+ "attention_sink_size": 4,
19
+ "tensor_parallel_shards": 1,
20
+ "max_batch_size": 128
21
+ },
22
+ "vocab_size": 32768,
23
+ "context_window_size": 32768,
24
+ "sliding_window_size": -1,
25
+ "prefill_chunk_size": 8192,
26
+ "attention_sink_size": 4,
27
+ "tensor_parallel_shards": 1,
28
+ "pipeline_parallel_stages": 1,
29
+ "temperature": 1.0,
30
+ "presence_penalty": 0.0,
31
+ "frequency_penalty": 0.0,
32
+ "repetition_penalty": 1.0,
33
+ "top_p": 1.0,
34
+ "tokenizer_files": [
35
+ "tokenizer.model",
36
+ "tokenizer.json",
37
+ "tokenizer_config.json"
38
+ ],
39
+ "tokenizer_info": {
40
+ "token_postproc_method": "byte_fallback",
41
+ "prepend_space_in_encode": false,
42
+ "strip_space_in_decode": false
43
+ },
44
+ "conv_template": {
45
+ "name": "mistral_default",
46
+ "system_template": "[INST] {system_message}",
47
+ "system_message": "Always assist with care, respect, and truth. Respond with utmost utility yet securely. Avoid harmful, unethical, prejudiced, or negative content. Ensure replies promote fairness and positivity.",
48
+ "system_prefix_token_ids": [
49
+ 1
50
+ ],
51
+ "add_role_after_system_message": false,
52
+ "roles": {
53
+ "user": "[INST]",
54
+ "assistant": "[/INST]",
55
+ "tool": "[INST]"
56
+ },
57
+ "role_templates": {
58
+ "user": "{user_message}",
59
+ "assistant": "{assistant_message}",
60
+ "tool": "{tool_message}"
61
+ },
62
+ "messages": [],
63
+ "seps": [
64
+ " "
65
+ ],
66
+ "role_content_sep": " ",
67
+ "role_empty_sep": "",
68
+ "stop_str": [
69
+ "</s>"
70
+ ],
71
+ "stop_token_ids": [
72
+ 2
73
+ ],
74
+ "function_string": "",
75
+ "use_function_calling": false
76
+ },
77
+ "pad_token_id": 0,
78
+ "bos_token_id": 1,
79
+ "eos_token_id": 2
80
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91fed35942c45a1a516d925b9465c3cd32d3d6a087dc71dd74742faf8ed0ca9b
3
+ size 100663296
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:671da3f1ffc36755829ca6c18d21f8fa92caecd3de887f1a0b41811af7ccab8f
3
+ size 100663296
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27ce564bb38c2d0346503d915f7703c4f658341ce6af93cdfb04da5aa3d4e7d5
3
+ size 18874368
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b5b47b5ae0b9f91c3f3ad012cbae666fc010ef7494cf96e1446e05346845096
3
+ size 24403968
params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:240010d8388f55603cda1789c25b0cea647fa1717704ddf8f50b3189eef7d946
3
+ size 18874368
params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c2376c5a08ce50697a316841ff287da0a471113b8869df722daf51980080780
3
+ size 50331648
params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c690d47e985893853051daeb7b29be9380ee7e6ca0302fa58e70b9f74fcfb13
3
+ size 100663296
params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d689be89a7dd16f6dd8c17457f60231b5eeb1aa16a2e3c8ee92b1ce008472832
3
+ size 24403968
params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c07dff09b316722a196a900e321c3e4430d8534989247b75eccf00dd19bcf055
3
+ size 25165824
params_shard_134.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8666900cd857d22741e244d62241be846a80ccda1fb627ef2fa884edd4a8df62
3
+ size 24403968
params_shard_136.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f87edbaee425ceb1ea2a41d866e18c1bd33fa41547f6cd524dd239bcab523110
3
+ size 18874368
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8a5adfe810b1f94378fad41dad71a539b7e4a59d9cb60e080a2e8b73d952de7
3
+ size 24403968
params_shard_142.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0aaad2a2408078cd0912cfb06c83caafe3b75d90f0bb8f5ca896b8ecd05a67e3
3
+ size 50331648
params_shard_153.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99b44354b4fdccd9397970fd348ff6816640df7bfe1b3152d0c30bc9b707b791
3
+ size 100663296
params_shard_166.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07feb3fd6987186cfac83e69d158efd3b730c419cdf8f472920901cb87bc4d9c
3
+ size 18874368
params_shard_175.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51057b9c20db5e71b320600bf8adcfcd6505feb79b3740e3046b3034fb2cd8d4
3
+ size 25165824
params_shard_202.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86298589bc92a3a2e04e11d2bb70067f082434210a1ada00299342c70955be57
3
+ size 50331648
params_shard_212.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b14885f5708141978df008545f840c73b6626372e956b3cc68ca9641cfb8872
3
+ size 50331648
params_shard_214.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7cb380cf752c5a99abc4941f3bc086aa6456b0445d70f60750a408921369b058
3
+ size 24403968
params_shard_218.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f815a33d13da4a45eeecd37bcbdb24fb8dbe15306422cdf5a6333dd7e2f87dc
3
+ size 100663296
params_shard_219.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e54a19a4154d8dc7fe81c0986ae866f3d9fee9bbd42f89537afae2f954e6992c
3
+ size 24403968
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09ef45e3b0dbcadbeb836d99103101cf2f362ec4a677014c800bfa7f66585ab3
3
+ size 50331648
params_shard_220.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f75a5ad7e15136d59a5dd6892a0d723f958fb3f85a4cbe9ddd37ea010fe31f12
3
+ size 25165824
params_shard_221.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:624896234be4bfc96a589ae243ef73590719d9e2373978c78d1c9a1589ae44d8
3
+ size 18874368
params_shard_225.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:109a0b199704dbea9331de82d4b2938ec1810f500e62048e4e1f9ce6d17bfc26
3
+ size 25165824
params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e2655765ce6575225d4cb12c84ac225ae6319d8da76382b38c463d32d8d3b2b
3
+ size 25165824
params_shard_251.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ed0974e28367934a7bbb8c3d2dc058898b8444ddb57bb12ddc7c8feebdbb8d7
3
+ size 18874368
params_shard_258.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fdd06f95eb6c5da17167fe7bd39624724c631267d0965b0f0c0b35ce387c4d2
3
+ size 100663296
params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a60a20afcbedc9c553892777c026ceb7840fe611bc56e65e51b9a295eaaf7118
3
+ size 18874368
params_shard_261.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65326d1b8c9186f419342faf24c92aba6b41a304ebc09aec029a72af95dba7b6
3
+ size 18874368
params_shard_270.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d6c3bc7d49e662e2027510c8c72f26dddcf3cc2fb06d8561dcf57515ca52206
3
+ size 25165824
params_shard_273.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1fefb93b891a44ff333518884fbb9fc0c6549d3a6b67329ab6163ee58138f8e
3
+ size 100663296
params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d9ac058a3c9bf22eb55e2d2e8765f20f49da4dafa03068a554190ee7c9a39cf
3
+ size 24403968
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0158322398f472ef9c7c690ab912bff4bc31b4bc8b2f2602b4283ec8581bd4f6
3
+ size 100663296
params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1305c2db49d1d8956d77e23e98c7c5f0a7f3598cee0642c6284f7bd6f1e6bb10
3
+ size 18874368
params_shard_45.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0734eacd84988b37f91403bba63af17fc5328e6d49825e938a1f434d10679172
3
+ size 25165824
params_shard_48.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4c87f6601e4ddf59c8f927b1689612a5d942160b2cca7c145546c46cba5f242
3
+ size 100663296
params_shard_6.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6340c473a013d6aea481d639edefa9b6c0f24da1eee3bf82fc9b16c09546b6a5
3
+ size 18874368
params_shard_63.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a6abf0577bc0db20a40fccd3474d81e75f537c3376bf24788809f305f3d634e
3
+ size 100663296
params_shard_67.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59a1f0dc0df20367d3a8dc8689d380159f46bb8685a6328463b09c5da9f20ba8
3
+ size 50331648
params_shard_70.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5db0a700a1009d20c20e385e975167d0471aa5073c9e0741186a36d2b99a813a
3
+ size 25165824
params_shard_77.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e2739df32e7ecd6bde1f3916ec2be0521f0132f63975103dbf5185478934b50
3
+ size 50331648
params_shard_8.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b8c48fc9e03d26f8908c082c1f8e57ea2ec1e8ed056ee658859a78c1fbcacc0
3
+ size 100663296
params_shard_80.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:700a38b849183c69b29daaa6bbe8b5c58895b47bb64e8f5ad767e4161fade460
3
+ size 25165824
params_shard_82.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9e1eeeccc3cc6c39bdbf8255bd03d35d0db68c90989999d5a4b085d0f57fbde
3
+ size 50331648
params_shard_99.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0b93eb78cf272e845a85d2457392313dccaf649852716cbe0f5f4c6e51a41b8
3
+ size 24403968
tokenizer_config.json ADDED
The diff for this file is too large to render. See raw diff