Upload fine-tuned intent detection model - 2025-06-24 14:04:19
Browse files
- 0000050_adapters.safetensors +3 -0
- 0000100_adapters.safetensors +3 -0
- README.md +2 -2
- adapter_config.json +35 -0
- adapters.safetensors +3 -0
- model_config.json +9 -9
0000050_adapters.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:944413997cab576d5f7619f1cfb5c368e9e8eb7644ea5b01ee244f24fe2be3c4
|
| 3 |
+
size 2497239
|
0000100_adapters.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a4c814a70c1e82e10d9cf893bd7a3fa3b6c90cb1ee42cbd1e962de8e1a4df65
|
| 3 |
+
size 2497239
|
README.md
CHANGED
|
@@ -65,8 +65,8 @@ let model = try await LLMModelFactory.shared.loadContainer(
|
|
| 65 |
## Training Details
|
| 66 |
|
| 67 |
- **Fine-tuning Method**: LoRA with model fusion
|
| 68 |
-
- **Export Date**: 2025-06-
|
| 69 |
-
- **Fusion Completed**:
|
| 70 |
|
| 71 |
## Expected Outputs
|
| 72 |
|
|
|
|
| 65 |
## Training Details
|
| 66 |
|
| 67 |
- **Fine-tuning Method**: LoRA with model fusion
|
| 68 |
+
- **Export Date**: 2025-06-24T14:04:19.734671
|
| 69 |
+
- **Fusion Completed**: False
|
| 70 |
|
| 71 |
## Expected Outputs
|
| 72 |
|
adapter_config.json
ADDED
|
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"adapter_path": "/Users/hebertg/iOSDev/KnowledgeBase/MLX-Fine-Tuning-Pipeline/outputs/knowledgebase-adapter",
|
| 3 |
+
"batch_size": 2,
|
| 4 |
+
"config": null,
|
| 5 |
+
"data": "/Users/hebertg/iOSDev/KnowledgeBase/MLX-Fine-Tuning-Pipeline/outputs/mlx_data",
|
| 6 |
+
"fine_tune_type": "lora",
|
| 7 |
+
"grad_checkpoint": false,
|
| 8 |
+
"iters": 100,
|
| 9 |
+
"learning_rate": 0.0001,
|
| 10 |
+
"lora_parameters": {
|
| 11 |
+
"rank": 8,
|
| 12 |
+
"dropout": 0.0,
|
| 13 |
+
"scale": 20.0
|
| 14 |
+
},
|
| 15 |
+
"lr_schedule": null,
|
| 16 |
+
"mask_prompt": false,
|
| 17 |
+
"max_seq_length": 512,
|
| 18 |
+
"model": "mlx-community/Qwen2.5-1.5B-Instruct-4bit",
|
| 19 |
+
"num_layers": 16,
|
| 20 |
+
"optimizer": "adam",
|
| 21 |
+
"optimizer_config": {
|
| 22 |
+
"adam": {},
|
| 23 |
+
"adamw": {}
|
| 24 |
+
},
|
| 25 |
+
"resume_adapter_file": null,
|
| 26 |
+
"save_every": 50,
|
| 27 |
+
"seed": 0,
|
| 28 |
+
"steps_per_eval": 25,
|
| 29 |
+
"steps_per_report": 10,
|
| 30 |
+
"test": false,
|
| 31 |
+
"test_batches": 500,
|
| 32 |
+
"train": true,
|
| 33 |
+
"val_batches": 25,
|
| 34 |
+
"wandb": null
|
| 35 |
+
}
|
adapters.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a4c814a70c1e82e10d9cf893bd7a3fa3b6c90cb1ee42cbd1e962de8e1a4df65
|
| 3 |
+
size 2497239
|
model_config.json
CHANGED
|
@@ -1,11 +1,13 @@
|
|
| 1 |
{
|
| 2 |
"model_info": {
|
| 3 |
-
"model_id": "
|
| 4 |
"model_type": "intent_detection",
|
| 5 |
"version": "1.0",
|
| 6 |
-
"base_model": "mlx-community/Qwen2.5-1.5B-Instruct-4bit"
|
| 7 |
-
|
| 8 |
-
|
|
|
|
|
|
|
| 9 |
},
|
| 10 |
"inference_settings": {
|
| 11 |
"max_tokens": 256,
|
|
@@ -45,13 +47,11 @@
|
|
| 45 |
"examples": 5000,
|
| 46 |
"iterations": 100,
|
| 47 |
"training_completed": true,
|
| 48 |
-
"export_timestamp": "2025-06-
|
| 49 |
-
"fusion_completed": true
|
| 50 |
},
|
| 51 |
"ios_integration": {
|
| 52 |
-
"
|
| 53 |
-
"
|
| 54 |
-
"requires_download": false,
|
| 55 |
"system_prompt": "You are a helpful AI assistant for a knowledge-management app on an iPhone."
|
| 56 |
}
|
| 57 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"model_info": {
|
| 3 |
+
"model_id": "mlx-community/Qwen2.5-1.5B-Instruct-4bit",
|
| 4 |
"model_type": "intent_detection",
|
| 5 |
"version": "1.0",
|
| 6 |
+
"base_model": "mlx-community/Qwen2.5-1.5B-Instruct-4bit"
|
| 7 |
+
},
|
| 8 |
+
"adapter_files": {
|
| 9 |
+
"adapters": "adapters.safetensors",
|
| 10 |
+
"config": "adapter_config.json"
|
| 11 |
},
|
| 12 |
"inference_settings": {
|
| 13 |
"max_tokens": 256,
|
|
|
|
| 47 |
"examples": 5000,
|
| 48 |
"iterations": 100,
|
| 49 |
"training_completed": true,
|
| 50 |
+
"export_timestamp": "2025-06-24T14:04:19.734671"
|
|
|
|
| 51 |
},
|
| 52 |
"ios_integration": {
|
| 53 |
+
"adapter_path": "Model/adapters.safetensors",
|
| 54 |
+
"config_path": "Model/adapter_config.json",
|
|
|
|
| 55 |
"system_prompt": "You are a helpful AI assistant for a knowledge-management app on an iPhone."
|
| 56 |
}
|
| 57 |
}
|