# Llama-3-SS-Infused-R1776-70B / mergekit_config.yml
# yasu-oh
# add_model
# 76ac94f
# MergeKit configuration for SS infused R1-1776 (Llama3-70B based)
#
# Intended result, written as a single linear merge:
#   yasu-oh/Llama-3-Swallow-Infused-R1776-70B
#     + 0.4 * (shisa-ai/shisa-v2-llama3.3-70b
#              - meta-llama/Llama-3.3-70B-Instruct)
#
# NOTE(review): the model paths below are local directories; the "-pruned"
# copies are presumably derived from the hub models named above - confirm
# before re-running the merge.
merge_method: linear
dtype: bfloat16
models:
  # Base model: kept at full weight.
  - model: ./Llama-3-Swallow-Infused-R1776-70B
    parameters:
      weight: 1.0
  # Add: 0.4 * (Shisa V2 - Meta Llama3.3)
  # The positive half of the difference term.
  - model: ./shisa-v2-llama3.3-70b-pruned
    parameters:
      weight: 0.4
  # The negative half of the difference term: the same magnitude with the
  # opposite sign, so only the (Shisa V2 - Meta Llama3.3) delta is added.
  - model: ./Llama-3.3-70B-Instruct-pruned
    parameters:
      weight: -0.4
# Top-level merge parameters (not tied to a single model entry).
parameters:
  # The weights above sum to 1.0 (1.0 + 0.4 - 0.4), so normalizing them
  # should leave the effective weights unchanged.
  normalize: true