# Learning-rate scan submissions for Qwen2.5-Coder-7B-Instruct SFT runs.
#
# Every job is submitted with the same sbatch options and the same layout of
# positional arguments to slurm/train.slurm; only the run version, the recipe
# version, the learning rate and an optional extra trainer flag differ, so the
# shared part lives in one helper.

# submit_sft RUN_VERSION RECIPE_VERSION LEARNING_RATE [EXTRA_ARG]
#
#   RUN_VERSION     Suffix used for the job name, --run_name, --hub_model_revision
#                   and --output_dir (e.g. v02.01).
#   RECIPE_VERSION  Third positional argument handed to slurm/train.slurm
#                   (e.g. v02.00) -- presumably selects the recipe/config file;
#                   confirm against slurm/train.slurm.
#   LEARNING_RATE   Value passed as --learning_rate=... (e.g. 1.0e-5).
#   EXTRA_ARG       Optional extra trainer flag, inserted right after
#                   --learning_rate (e.g. --packing=false).
#
# The trainer flags are deliberately passed to slurm/train.slurm as ONE
# space-separated argument, which is why they are assembled into a single
# string and quoted as a whole.
submit_sft() {
    local run_version="$1"
    local recipe_version="$2"
    local learning_rate="$3"
    local extra_arg="${4:-}"

    local run_name="qwen-7B_codeforces-cot_${run_version}"

    local trainer_args="--learning_rate=${learning_rate}"
    if [ -n "${extra_arg}" ]; then
        trainer_args="${trainer_args} ${extra_arg}"
    fi
    trainer_args="${trainer_args} --hub_model_id=open-r1/Qwen2.5-Coder-7B-Instruct-SFT"
    trainer_args="${trainer_args} --hub_model_revision=${run_version}"
    trainer_args="${trainer_args} --output_dir=data/Qwen2.5-Coder-7B-Instruct-SFT-${run_version}"
    trainer_args="${trainer_args} --run_name=${run_name}"
    trainer_args="${trainer_args} --wandb_entity huggingface --wandb_project open-r1"

    sbatch --mail-type=ALL --mail-user=lewis+hfc@huggingface.co \
        --output=/fsx/h4/logs/%x-%j.out --err=/fsx/h4/logs/%x-%j.err \
        --job-name="${run_name}" --nodes=1 \
        slurm/train.slurm Qwen2.5-Coder-7B-Instruct sft "${recipe_version}" zero3 \
        "${trainer_args}"
}

# V02.0X = lr scan, packing=true
submit_sft v02.00 v02.00 1.0e-5
submit_sft v02.01 v02.00 2.0e-5
submit_sft v02.02 v02.00 4.0e-5

# V02.1X = lr scan, packing=false
submit_sft v02.10 v02.00 1.0e-5 --packing=false
# NOTE(review): every other scan uses 2.0e-5 as the middle point; 2.1e-5 is
# kept exactly as recorded -- confirm whether it was intentional.
submit_sft v02.11 v02.00 2.1e-5 --packing=false
submit_sft v02.12 v02.00 4.0e-5 --packing=false

# V03.0X = lr scan, packing=true
submit_sft v03.00 v03.00 1.0e-5
submit_sft v03.01 v03.00 2.0e-5
submit_sft v03.02 v03.00 4.0e-5

# V04.0X = lr scan, packing=true
submit_sft v04.00 v04.00 1.0e-5
submit_sft v04.01 v04.00 2.0e-5
submit_sft v04.02 v04.00 4.0e-5

# V05.0X = lr scan, packing=true
submit_sft v05.00 v05.00 1.0e-5
submit_sft v05.01 v05.00 2.0e-5
submit_sft v05.02 v05.00 4.0e-5

# V06.0X = lr scan, packing=true
submit_sft v06.00 v06.00 1.0e-5
submit_sft v06.01 v06.00 2.0e-5
submit_sft v06.02 v06.00 4.0e-5

# V06.1X = lr scan, packing=false
submit_sft v06.10 v06.00 1.0e-5 --packing=false
submit_sft v06.11 v06.00 2.0e-5 --packing=false
submit_sft v06.12 v06.00 4.0e-5 --packing=false

# V07.0X = lr scan, packing=true
submit_sft v07.00 v07.00 1.0e-5
submit_sft v07.01 v07.00 2.0e-5
submit_sft v07.02 v07.00 4.0e-5

# V07.1X = lr scan, packing=false
submit_sft v07.10 v07.00 1.0e-5 --packing=false
submit_sft v07.11 v07.00 2.0e-5 --packing=false
submit_sft v07.12 v07.00 4.0e-5 --packing=false
Uh oh!
There was an error while loading. Please reload this page.
Saving for reference, no need to review:
LR scan