Skip to content

Commit 8d302c9

Browse files
committed
🔥 Remove unneeded configs
1 parent 4f74d57 commit 8d302c9

File tree

1 file changed

+0
-9
lines changed

1 file changed

+0
-9
lines changed

slime/configs/base.py

Lines changed: 0 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -84,15 +84,6 @@ def generate_train_args(self, models_path: Path, data_path: Path, is_infinite_ru
84 84   --use-rotary-position-embeddings --rotary-base 1000000
85 85   """
86 86
87    - QWEN3_0_5B_MODEL_ARGS = """
88    - --num-layers 24 --hidden-size 1024 --ffn-hidden-size 3072
89    - --num-attention-heads 16 --group-query-attention --num-query-groups 8
90    - --kv-channels 64 --vocab-size 151936
91    - --normalization RMSNorm --norm-epsilon 1e-6 --swiglu
92    - --disable-bias-linear --qk-layernorm
93    - --use-rotary-position-embeddings --rotary-base 1000000
94    - """
95    -
96 87   DEFAULT_TRAINING_ARGS = """
97 88   --tensor-model-parallel-size 2 --sequence-parallel
98 89   --recompute-granularity full --recompute-method uniform --recompute-num-layers 1

0 commit comments

Comments
 (0)