File tree: 4 files changed, +9 -9 lines changed
sub-packages/bionemo-evo2/src/bionemo/evo2/run
4 files changed, +9 -9 lines changed
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,7 @@ script_args:
1616 workspace : /workspace/bionemo2
1717 data_path : /data/evo2
1818 artefacts_url : https://__token__:${JET_GITLAB_TOKEN}@gitlab-master.nvidia.com/api/v4/projects/180496/packages/pypi/simple
19- file_name_wheel : cuhyena==v0.2.3+cuda12.9
19+ file_name_wheel : subquadratic-ops
2020 model : evo2
2121 variant : train
2222 config_name : 1b
@@ -55,7 +55,7 @@ script: |-
5555 --enable-preemption \
5656 --ckpt-async-save \
5757 --use-megatron-comm-overlap-llama3-8k \
58- --use-b2b-causal-conv1d \
58+ --use-subquadratic_ops \
5959 --overlap-grad-reduce \
6060 --clip-grad=${clip_grad} \
6161 --eod-pad-in-loss-mask \
@@ -78,7 +78,7 @@ script: |-
7878 --limit-val-batches=20 \
7979 --log-every-n-steps=50 \
8080 --val-check-interval=500 \
81- --use-b2b-causal-conv1d \
81+ --use-subquadratic_ops \
8282 --create-tflops-callback \
8383 --create-tensorboard-logger \
8484 --result-dir=${tensorboard_dir} \
Original file line number | Diff line number | Diff line change
@@ -76,7 +76,7 @@ script: |-
7676 --limit-val-batches=20 \
7777 --log-every-n-steps=50 \
7878 --val-check-interval=200 \
79- --use-b2b-causal-conv1d \
79+ --use-subquadratic_ops \
8080 --create-tflops-callback \
8181 --create-tensorboard-logger \
8282 --result-dir=${tensorboard_dir} \
Original file line number | Diff line number | Diff line change
@@ -462,9 +462,9 @@ def parse_args(args: Optional[List[str]] = None) -> argparse.Namespace:
462462 help = "Dropout probability for the attention layers." ,
463463 )
464464 parser .add_argument (
465- "--use-b2b-causal-conv1d " ,
465+ "--use-subquadratic_ops " ,
466466 action = "store_true" ,
467- help = "Use back-to-back causal convolution CUDA kernel for hyena short conv layers for improved performance." ,
467+ help = "Use subquadratic_ops for improved performance." ,
468468 )
469469 parser .add_argument (
470470 "--save-top-k" ,
@@ -597,8 +597,8 @@ def train(args: argparse.Namespace) -> nl.Trainer:
597597 config_modifiers_init ["ffn_hidden_size" ] = args .ffn_hidden_size
598598 if args .use_targeted_variance_loss :
599599 config_modifiers_init ["use_targeted_variance_loss" ] = True
600- if args .use_b2b_causal_conv1d :
601- config_modifiers_init ["use_b2b_causal_conv1d " ] = True
600+ if args .use_subquadratic_ops :
601+ config_modifiers_init ["use_subquadratic_ops " ] = True
602602 if args .hybrid_override_pattern :
603603 config_modifiers_init ["hybrid_override_pattern" ] = args .hybrid_override_pattern
604604 if args .num_layers :
You can’t perform that action at this time.
0 commit comments