# Llama-3-SS-Infused-R1776-70B / mergekit_config.yml

# yasu-oh

# add_model

# 76ac94f 6 months ago

# 560 Bytes

	# MergeKit configuration for SS infused R1-1776 (Llama3-70B based)
	# yasu-oh/Llama-3-Swallow-Infused-R1776-70B + 0.4 * (shisa-ai/shisa-v2-llama3.3-70b - meta-llama/Llama-3.3-70B-Instruct)

	merge_method: linear
	dtype: bfloat16

	models:
	# BaseModel:
	- model: ./Llama-3-Swallow-Infused-R1776-70B
	parameters:
	weight: 1.0

	# Add: 0.4 * (Shisa V2 - Meta Llama3.3)
	- model: ./shisa-v2-llama3.3-70b-pruned
	parameters:
	weight: 0.4

	- model: ./Llama-3.3-70B-Instruct-pruned
	parameters:
	weight: -0.4

	parameters:
	normalize: true