de-llama3-discoleo-instruct-8b-v0.1-x-meta-llama-3-8b-instruct-della_linear-50_50
/
mergekit_config.yml
```yaml
merge_method: della_linear
models:
  - model: DiscoResearch/Llama3-DiscoLeo-Instruct-8B-v0.1
    parameters:
      weight: 0.5
  - model: meta-llama/Meta-Llama-3-8B-Instruct
    parameters:
      weight: 0.5
parameters:
  normalize: true
  int8_mask: true
  density: 0.5
  lambda: 1.0
  epsilon: 0.2
dtype: bfloat16
tokenizer:
  source: union
base_model: meta-llama/Meta-Llama-3-8B-Instruct
write_readme: README.md
```