-
Notifications
You must be signed in to change notification settings - Fork 515
Expand file tree
/
Copy pathsingle_gpu.sh
More file actions
executable file
·38 lines (37 loc) · 1.26 KB
/
single_gpu.sh
File metadata and controls
executable file
·38 lines (37 loc) · 1.26 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
#!/bin/bash
BEAKER_IMAGE="${1:-nathanl/open_instruct_auto}"
uv run python mason.py \
--cluster ai2/saturn \
--cluster ai2/jupiter \
--description "Single GPU DPO run with OLMo-core, for debugging purposes." \
--workspace ai2/open-instruct-dev \
--priority urgent \
--image "$BEAKER_IMAGE" \
--pure_docker_mode \
--preemptible \
--num_nodes 1 \
--budget ai2/oe-adapt \
--no_auto_dataset_cache \
--no-host-networking \
--env 'TORCH_LOGS=graph_breaks,recompiles' \
--gpus 1 -- torchrun --nproc_per_node=1 open_instruct/dpo.py \
--model_name_or_path allenai/OLMo-2-0425-1B \
--tokenizer_name_or_path allenai/OLMo-2-0425-1B \
--max_seq_length 1024 \
--per_device_train_batch_size 4 \
--gradient_accumulation_steps 1 \
--learning_rate 5e-07 \
--lr_scheduler_type linear \
--warmup_ratio 0.1 \
--weight_decay 0.0 \
--num_epochs 3 \
--output_dir output/dpo_olmo_core_debug/ \
--logging_steps 1 \
--mixer_list allenai/tulu-3-wildchat-reused-on-policy-8b 100 \
--chat_template_name olmo \
--exp_name "dpo-single-gpu-debug-$(date +%s)" \
--seed 123 \
--push_to_hub false \
--try_launch_beaker_eval_jobs false \
--try_auto_save_to_beaker false \
--with_tracking