File size: 356 Bytes
def8509
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
# Task Arithmetic - Grid Search
# Grid point for this file: weights 0.6 (Math) / 0.4 (Coder)

# How to merge, relative to which base, and the dtype setting for the merge.
merge_method: task_arithmetic
base_model: Qwen/Qwen2.5-7B
# NOTE(review): confirm float16 (rather than the source checkpoints' native
# dtype) is the intended setting here.
dtype: float16

# Method-wide settings: declared at the top level, so they are not tied to
# any single entry under `models`.
# NOTE(review): presumably `lambda` scales the combined result and
# `normalize: false` leaves the per-model weights un-normalized — confirm
# against the merge tool's documentation for `task_arithmetic`.
parameters:
  lambda: 1.0
  normalize: false

# Models being merged, each carrying its own `weight`.
# The two weights in this grid point are 0.6 and 0.4.
models:
  - model: Qwen/Qwen2.5-Math-7B-Instruct
    parameters:
      weight: 0.6
  - model: Qwen/Qwen2.5-Coder-7B-Instruct
    parameters:
      weight: 0.4

# Tokenizer selection for the merged output.
# NOTE(review): `union` presumably combines the vocabularies of all listed
# models — verify against the consumer's schema.
tokenizer:
  source: union