---
# Task Arithmetic - Grid Search
# Weights: 0.6, 0.4
#
# mergekit configuration: combines two Qwen2.5-7B fine-tunes on top of their
# shared base using the `task_arithmetic` merge method. This file is one
# point of a weight grid search; only the two `weight` values below are
# expected to differ between grid points (presumably -- confirm against the
# sibling configs).

# Reference checkpoint that the listed models are diffed against.
base_model: Qwen/Qwen2.5-7B

# Models to merge; each entry carries its own per-model weight.
models:
  - model: Qwen/Qwen2.5-Math-7B-Instruct
    parameters:
      weight: 0.6
  - model: Qwen/Qwen2.5-Coder-7B-Instruct
    parameters:
      weight: 0.4

merge_method: task_arithmetic

# Global (method-level) parameters, as opposed to the per-model ones above.
parameters:
  # Weights are used as written rather than rescaled to sum to 1
  # (they already sum to 1.0 here).
  normalize: false
  # Scaling factor for the merged result; 1.0 leaves it unscaled.
  lambda: 1.0

# Precision used for the merge.
# NOTE(review): the Qwen2.5 checkpoints appear to be published in bfloat16;
# confirm that float16 is intended here.
dtype: float16

# Build the output tokenizer from the union of the input vocabularies.
tokenizer:
  source: union