# lejelly's picture
# Upload folder using huggingface_hub
# def8509 verified
# Task Arithmetic - Grid Search
# Weights: 0.6 (Math-Instruct), 0.4 (Coder-Instruct)
#
# NOTE(review): key layout follows what appears to be a mergekit merge
# config (base_model / models / merge_method / parameters / dtype /
# tokenizer) - confirm against the consuming tool's schema.

# Model the two fine-tuned models below are merged relative to.
base_model: Qwen/Qwen2.5-7B

# Models to merge; each entry carries its own per-model weight.
models:
  - model: Qwen/Qwen2.5-Math-7B-Instruct
    parameters:
      weight: 0.6
  - model: Qwen/Qwen2.5-Coder-7B-Instruct
    parameters:
      weight: 0.4

merge_method: task_arithmetic

# Settings that apply to the merge as a whole (not to a single model).
parameters:
  # Weights are used as given; they already sum to 1.0 here.
  normalize: false
  # Presumably a global scale on the merged result (1.0 = unscaled) -
  # TODO confirm against the merge tool's documentation.
  lambda: 1.0

dtype: float16

tokenizer:
  # Presumably builds the output vocabulary from all listed models -
  # TODO confirm.
  source: union