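# Provenance (captured from the Hugging Face file viewer):
#   Repository: ScaleAI / swe-oec-7b  (tabs: Model card, Files and versions)
#   File:       swe-oec-7b / rlxf_job_config.yaml  (3.71 kB)
#   Commit:     32d9566 (verified), "Upload folder using huggingface_hub",
#               shown under user "jda", listed as "6 months ago" at capture time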

	dataset: s3://scale-ml/users/niklas/swe-agent/train/mixed-smith7b-switch-smith32b/3000dagger-1000imitation
	debug: false
	eval_at_step_zero: null
	eval_case_report: false
	eval_case_report_only_splits: []
	eval_mode: false
	eval_steps: 0.2
	eval_strategy: steps
	experimental:
	activation_checkpointing: true
	enable_context_parallel: false
	mask_input_ids_by_flag: false
	pad_to_max_length: false
	pipeline_parallel_reshard: false
	pipeline_parallel_schedule: gpipe
	pipeline_parallel_size: 1
	pp_last_stage_offset: 0
	pp_share_train_eval_schedule: true
	torch_compile: false
	hyperparams:
	adam_beta1: 0.9
	adam_beta2: 0.999
	adam_epsilon: 1.0e-08
	adam_weight_decay: null
	constant_pack: false
	eval_num_rollouts_per_prompt: 1
	gradient_accumulation_steps: 4
	learning_rate: 5.0e-05
	loss_form: null
	lr_scheduler_kwargs: null
	lr_scheduler_type: cosine
	mask_instruct: true
	max_grad_norm: 1.0
	max_length: 32768
	num_rollouts_per_prompt: 1
	num_train_epochs: 3
	num_train_steps: -1
	online: false
	optimizer: adam
	per_device_eval_batch_size: 2
	per_device_micro_batch_size: 1
	per_device_train_batch_size: 2
	sleep_level: 2
	warmup_ratio: 0.06
	weight_decay: 0.01
	local_output_path: /mnt/nvme
	logging_rollouts: 0
	logging_steps: 1
	model_squad:
	lm:
	activation_checkpointing: true
	model_path: s3://scale-ml/users/niklas/models/SWE-smith-7b-sft-torchtune/epoch_2
	parallel_state:
	cp_mesh: null
	cp_size: 1
	device_type: cuda
	dp_size: 8
	pp_size: 1
	world_mesh: !!python/object:torch.distributed.device_mesh.DeviceMesh
	_coordinate_on_dim:
	- 0
	_dim_group_infos:
	- !!python/tuple
	- ptd:0
	- - 0
	- 1
	- 2
	- 3
	- 4
	- 5
	- 6
	- 7
	- '0'
	_flatten_mesh_list: !!python/tuple
	- 0
	- 1
	- 2
	- 3
	- 4
	- 5
	- 6
	- 7
	_hash: 5913564447349333664
	_thread_id: null
	device_type: cuda
	mesh: !!python/object/apply:torch._utils._rebuild_tensor_v2
	- !!python/object/apply:torch.storage._load_from_bytes
	- !!binary \|
	gAKKCmz8nEb5IGqoUBkugAJN6QMugAJ9cQAoWBAAAABwcm90b2NvbF92ZXJzaW9ucQFN6QNYDQAA
	AGxpdHRsZV9lbmRpYW5xAohYCgAAAHR5cGVfc2l6ZXNxA31xBChYBQAAAHNob3J0cQVLAlgDAAAA
	aW50cQZLBFgEAAAAbG9uZ3EHSwR1dS6AAihYBwAAAHN0b3JhZ2VxAGN0b3JjaApJbnRTdG9yYWdl
	CnEBWA4AAAA5NDY0MTQwNDM2MTI5NnECWAMAAABjcHVxA0sITnRxBFEugAJdcQBYDgAAADk0NjQx
	NDA0MzYxMjk2cQFhLggAAAAAAAAAAAAAAAEAAAACAAAAAwAAAAQAAAAFAAAABgAAAAcAAAA=
	- 0
	- !!python/tuple
	- 8
	- !!python/tuple
	- 1
	- false
	- !!python/object/apply:collections.OrderedDict
	- []
	mesh_dim_names: !!python/tuple
	- dp
	world_size: 8
	torch_compile: false
	use_fsdp2: true
	use_scale_llama: false
	processing_interface:
	class_name: BaseProcessingInterface
	module_path: trainers.processing_interface
	remote_object: {}
	resume: false
	s3_output_path: s3://scale-ml/users/niklas/models/mixed-smith7b-switch-smith32b/3000dagger-1000imitation
	save_at_step_zero: null
	save_final_model: true
	save_hf: true
	save_lr_scheduler: false
	save_optimizer: false
	save_s3_async: true
	save_steps: 0.2
	save_strategy: epoch
	task: sft
	use_device_mesh: true
	use_fsdp2: true
	use_scale_llama: false
	wandb:
	entity: gen-ai
	name: mixed-smith7b-switch-smith32b-3000dagger-1000imitation
	project: agent-rlxf
	wandb_host: https://scaleai.wandb.io/
	wandb_key_name: NIKLAS_WANDB_API_KEY
	wandb_secretsmanager_location: team/GENAIML/secret-store-key