| models: | |
| - model: Zhihu-ai/Zhi-writing-dsr1-14b | |
| - model: agentica-org/DeepCoder-14B-Preview | |
| - model: mergekit-community/Qwen2.5-14B-della-code | |
| - model: mergekit-community/Qwen2.5-14B-della-v2-dpo | |
| - model: mergekit-community/Qwen2.5-14B-della-V6-dpo | |
| - model: mergekit-community/Qwen2.5-14B-della-Nova-dpo | |
| - model: mergekit-community/Qwen2.5-14B-della-base-dpo | |
| - model: mergekit-community/Qwen2.5-14B-della-1M-dpo | |
| merge_method: karcher | |
| base_model: mergekit-community/Qwen2.5-14B-della-1M-dpo | |
| parameters: | |
| max_iter: 1000 | |
| tokenizer_source: base | |
| dtype: float16 | |
| int8_mask: true | |
| normalize: true | |