# tinystories_batch_size.sh
# Batch-size sweep: launches train.py several times, varying only
# training.batch_size. Every launch receives the same optimizer overrides and
# the same run-name template.
#
# WANDB_MODE=offline and CUDA_VISIBLE_DEVICES=0 are set for each launched
# command only; they are not exported into this script's own environment.
# A failed launch does not prevent the following ones from starting, and the
# script's exit status is that of the final launch.

# Runs train.py through `uv run`.
# Arguments: the overrides specific to this launch; they are placed ahead of
#            the shared overrides listed below.
# Returns:   the exit status of the `uv` command.
run_training() {
  # The run-name template is single-quoted on purpose: the shell must not try
  # to expand ${training.batch_size}; the literal text is handed to train.py.
  # NOTE(review): presumably train.py's config system resolves it — confirm.
  # shellcheck disable=SC2016
  WANDB_MODE=offline CUDA_VISIBLE_DEVICES=0 uv run train.py "$@" \
    optimizer.max_lr=1e-3 \
    optimizer.weight_decay=0.01 \
    optimizer.max_l2_norm=2.0 \
    'optimizer.betas=[0.9,0.95]' \
    'logger.run_name=ts-bs${training.batch_size}'
}

# A single launch with -m and a comma-separated list of batch sizes.
# NOTE(review): presumably -m makes train.py sweep over the list — confirm.
run_training -m training.batch_size=256,128,64,32,16,8,4,2,1

# The larger batch sizes are each started as their own launch, without -m.
for batch_size in 512 768 1024; do
  run_training "training.batch_size=${batch_size}"
done