fusion-bench
/

Llama-3.2-1B-Instruct_Bradly-Terry-RM_Preference-700k

Text Classification

text-generation-inference

Model card Files Files and versions

Metrics Training metrics Community

Llama-3.2-1B-Instruct_Bradly-Terry-RM_Preference-700k/hydra_output_2024-12-01_00-02-51/.hydra/config.yaml

tanganke's picture

Upload folder using huggingface_hub

32c1ec9 verified 11 months ago

history blame contribute delete

2.6 kB

	fabric:
	loggers:
	_target_: lightning.fabric.loggers.TensorBoardLogger
	root_dir: outputs/logs
	name: llama_full_bradly_terry_rm
	version: null
	sub_dir: null
	default_hp_metric: false
	strategy:
	_target_: lightning.fabric.strategies.FSDPStrategy
	sharding_strategy: FULL_SHARD
	cpu_offload: false
	auto_wrap_policy:
	_target_: fusion_bench.mixins.lightning_fabric.get_policy
	_args_:
	- transformers.models.llama.modeling_llama.LlamaDecoderLayer
	activation_checkpointing_policy: ${.auto_wrap_policy}
	_target_: lightning.Fabric
	_recursive_: true
	devices: auto
	accelerator: auto
	precision: bf16-true
	method:
	_target_: fusion_bench.method.BradlyTerryRewardModeling
	_recursive_: false
	optimizer:
	_target_: torch.optim.AdamW
	lr: 0
	weight_decay: 0.001
	fused: null
	lr_scheduler:
	_target_: fusion_bench.optim.lr_scheduler.CosineDecayWithWarmup
	T_max: _T_max_
	init_lr: 0
	warmup_steps: 100
	max_lr: 5.0e-06
	min_lr: 1.0e-07
	dataloader_kwargs:
	batch_size: 8
	num_workers: 0
	pin_memory: true
	max_epochs: 2
	max_steps: -1
	max_steps_per_epoch: -1
	accumulate_grad_batches: 16
	lr_scheduler_interval: step
	lr_scheduler_frequency: 1
	checkpoint_save_interval: epoch
	checkpoint_save_frequency: 1
	gradient_clip_val: 1
	gradient_clip_algorithm: norm
	save_optimizer_state: false
	save_full_model: true
	save_ckpt_type: lightning
	ckpt_path: null
	max_length: 4096
	fix_token_embedding: true
	modelpool:
	_target_: fusion_bench.modelpool.CausalLMPool
	pretrained_model_name_or_path: meta-llama/Llama-3.2-1B-Instruct
	models:
	_pretrained_:
	_target_: fusion_bench.modelpool.seq_classification_lm.create_reward_model_from_pretrained
	pretrained_model_name_or_path: ${...pretrained_model_name_or_path}
	torch_dtype: bfloat16
	use_flash_attention_2: true
	tokenizer:
	_target_: transformers.AutoTokenizer.from_pretrained
	pretrained_model_name_or_path: ${..pretrained_model_name_or_path}
	pad_token: <\|end_of_text\|>
	train_datasets:
	preference_700k:
	_target_: fusion_bench.dataset.llama.preference_700k.load_tokenized_preference_700k_for_bradley_terry_rm
	tokenizer: ${...tokenizer}
	path: hendrydong/preference_700K
	split: train
	cache_path: null
	taskpool:
	_target_: fusion_bench.taskpool.DummyTaskPool
	model_save_path: null
	_target_: fusion_bench.programs.FabricModelFusionProgram
	_recursive_: false
	fast_dev_run: false
	dry_run: false
	print_config: true
	report_save_path: null
	print_function_call: true