Skip to content

Commit

Permalink
Merge remote-tracking branch 'origin/muon' into muon
Browse files Browse the repository at this point in the history
  • Loading branch information
dlwh committed Dec 12, 2024
2 parents 144e20f + 271479f commit 083835d
Showing 1 changed file with 10 additions and 0 deletions.
10 changes: 10 additions & 0 deletions error_loading_model.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,10 @@
#!/usr/bin/env bash
#
# Launches a Levanter `train_lm.py` run through infra/babysit-tpu-vm.sh on a
# preemptible v4-128 TPU VM named `muon-debug` in zone us-central2-b, using
# the muon optimizer and loading the step-4000 checkpoint of run `tjo9vxfb`.
# NOTE(review): judging by the file name this is presumably a reproduction
# script for a checkpoint-loading error — confirm with the author.
#
# Usage:
#   WANDB_API_KEY=<your key> bash error_loading_model.sh
#
# Required environment:
#   WANDB_API_KEY  Weights & Biases API key forwarded to the training job.
#
# Must be run from the directory that contains `infra/` and `levanter/`,
# because all script and config paths below are relative.

set -euo pipefail

# Take the secret from the caller's environment instead of embedding it in
# the script; abort with a clear message when it is missing or empty.
: "${WANDB_API_KEY:?export WANDB_API_KEY before running this script}"

# Start a dedicated ssh-agent. The output is captured first so that a failed
# start aborts the script under `set -e` (eval of an empty string would
# otherwise succeed silently), and quoted so it is evaluated verbatim.
agent_env=$(ssh-agent -s)
eval "$agent_env"

# Stop the agent started above on any exit path so it is not leaked.
# Errors are ignored on purpose: the agent may already be gone.
trap 'ssh-agent -k >/dev/null 2>&1 || true' EXIT

# Everything after `--` is handed to babysit-tpu-vm.sh as the command to run.
# NOTE(review): the key is still passed as a command-line word (visible in
# `ps`); presumably babysit-tpu-vm.sh expects VAR=value pairs here — confirm
# before changing how it is forwarded.
bash infra/babysit-tpu-vm.sh muon-debug -z us-central2-b -t v4-128 --preemptible -- \
  WANDB_API_KEY="${WANDB_API_KEY}" \
  bash levanter/infra/run.sh python \
  levanter/src/levanter/main/train_lm.py \
  --config_path levanter/config/llama2_100M_muon.yaml \
  --trainer.checkpointer.base_path gs://marin-us-central2/scratch/kaiyue/checkpoints/muon/llama2_100M_constant \
  --optimizer.type muon \
  --trainer.num_train_steps 10000 \
  --trainer.load_checkpoint_path gs://marin-us-central2/scratch/kaiyue/checkpoints/muon/llama2_100M_constant/tjo9vxfb/step-4000

0 comments on commit 083835d

Please sign in to comment.