Skip to content

Commit ad25818

Browse files
committed
fix typo
1 parent ffad13b commit ad25818

12 files changed

+29
-11
lines changed

scripts/pretrain_c4/llama_130m_apollo.sh

+1-1
Original file line number | Diff line number | Diff line change
@@ -22,6 +22,6 @@ torchrun --standalone --nproc_per_node 4 main_pretrain.py \
2222
--weight_decay 0 \
2323
--project apollo_test \
2424
--name apollo_test_apollo_130m \
25-
--save_dir ./ckpts/Appollo_130m_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}
25+
--save_dir ./ckpts/Apollo_130m_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}
2626

2727

scripts/pretrain_c4/llama_130m_apollo_mini.sh

+1-1
Original file line number | Diff line number | Diff line change
@@ -23,6 +23,6 @@ torchrun --standalone --nproc_per_node 4 main_pretrain.py \
2323
--weight_decay 0 \
2424
--project apollo_test \
2525
--name apollo_test_apollo_mini_130m \
26-
--save_dir ./ckpts/Appollo_130m_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}
26+
--save_dir ./ckpts/Apollo_130m_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}
2727

2828

scripts/pretrain_c4/llama_13b_apollo_mini.sh

+1-1
Original file line number | Diff line number | Diff line change
@@ -22,6 +22,6 @@ torchrun --standalone --nproc_per_node 4 main_pretrain.py \
2222
--weight_decay 0 \
2323
--project apollo_test \
2424
--name apollo_test_apollo_mini_13b \
25-
--save_dir ./ckpts/Appollo_13b_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}
25+
--save_dir ./ckpts/Apollo_13b_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}
2626

2727

scripts/pretrain_c4/llama_1b_apollo.sh

+1-1
Original file line number | Diff line number | Diff line change
@@ -22,6 +22,6 @@ torchrun --standalone --nproc_per_node 8 main_pretrain.py \
2222
--weight_decay 0 \
2323
--project apollo_test \
2424
--name apollo_test_apollo_1b \
25-
--save_dir ./ckpts/Appollo_7b_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}
25+
--save_dir ./ckpts/Apollo_7b_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}
2626

2727

scripts/pretrain_c4/llama_1b_apollo_mini.sh

+1-1
Original file line number | Diff line number | Diff line change
@@ -22,6 +22,6 @@ torchrun --standalone --nproc_per_node 8 main_pretrain.py \
2222
--weight_decay 0 \
2323
--project apollo_test \
2424
--name apollo_test_apollo_mini_1b \
25-
--save_dir ./ckpts/Appollo_7b_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}
25+
--save_dir ./ckpts/Apollo_7b_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}
2626

2727

scripts/pretrain_c4/llama_350m_apollo.sh

+1-1
Original file line number | Diff line number | Diff line change
@@ -22,4 +22,4 @@ torchrun --standalone --nproc_per_node 4 main_pretrain.py \
2222
--update_proj_gap 200 \
2323
--project apollo_test \
2424
--name apollo_test_apollo_350m \
25-
--save_dir ./ckpts/Appollo_350m_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}
25+
--save_dir ./ckpts/Apollo_350m_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}

scripts/pretrain_c4/llama_350m_apollo_mini.sh

+1-1
Original file line number | Diff line number | Diff line change
@@ -23,4 +23,4 @@ torchrun --standalone --nproc_per_node 4 main_pretrain.py \
2323
--update_proj_gap 200 \
2424
--project apollo_test \
2525
--name apollo_test_apollo_mini_350m \
26-
--save_dir ./ckpts/Appollo_350m_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}
26+
--save_dir ./ckpts/Apollo_350m_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}

scripts/pretrain_c4/llama_60m_apollo.sh

+1-1
Original file line number | Diff line number | Diff line change
@@ -22,4 +22,4 @@ torchrun --standalone --nproc_per_node 1 main_pretrain.py \
2222
--weight_decay 0 \
2323
--project apollo_test\
2424
--name apollo_test_apollo_60m \
25-
--save_dir ./ckpts/Appollo_60m_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}
25+
--save_dir ./ckpts/Apollo_60m_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}

scripts/pretrain_c4/llama_60m_apollo_mini.sh

+1-1
Original file line number | Diff line number | Diff line change
@@ -25,4 +25,4 @@ torchrun --standalone --nproc_per_node 1 main_pretrain.py \
2525
--weight_decay 0 \
2626
--project apollo_test\
2727
--name apollo_test_apollo_mini_60m \
28-
--save_dir ./ckpts/Appollo_60m_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}
28+
--save_dir ./ckpts/Apollo_60m_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}

scripts/pretrain_c4/llama_7b_adamw.sh

+18
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,18 @@
1+
# LLaMA-7B, Adamw, 8 A100, 1 Node
2+
3+
torchrun --standalone --nproc_per_node 8 main_pretrain.py \
4+
--model_config configs/llama_7b.json \
5+
--eval_every 1000 \
6+
--dtype bfloat16 \
7+
--batch_size 4 \
8+
--total_batch_size 512 \
9+
--lr 0.01 \
10+
--warmup_steps 15000 \
11+
--num_training_steps 150000 \
12+
--optimizer adamw \
13+
--weight_decay 0 \
14+
--project apollo_test \
15+
--name adamw_test_apollo_7b \
16+
--save_dir ./ckpts/Adamw_7b_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}
17+
18+

scripts/pretrain_c4/llama_7b_apollo.sh

+1-1
Original file line number | Diff line number | Diff line change
@@ -22,6 +22,6 @@ torchrun --standalone --nproc_per_node 8 main_pretrain.py \
2222
--weight_decay 0 \
2323
--project apollo_test \
2424
--name apollo_test_apollo_7b \
25-
--save_dir ./ckpts/Appollo_7b_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}
25+
--save_dir ./ckpts/Apollo_7b_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}
2626

2727

scripts/pretrain_c4/llama_7b_apollo_mini.sh

+1-1
Original file line number | Diff line number | Diff line change
@@ -21,6 +21,6 @@ torchrun --standalone --nproc_per_node 8 main_pretrain.py \
2121
--weight_decay 0 \
2222
--project apollo_test \
2323
--name apollo_test_apollo_mini_7b \
24-
--save_dir ./ckpts/Appollo_7b_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}
24+
--save_dir ./ckpts/Apollo_7b_scale${apollo_scale}_rank${num_rank}_proj${proj_type}_type${scale_type}
2525

2626

0 commit comments

Comments
 (0)