Skip to content

Commit 73982f1

Browse files
author
Eric T. Dawson
committed
Merge branch 'main' of https://github.com/nvidia/bionemo-framework into edawson/scdl-schema
2 parents 9ecc929 + 555ee5f commit 73982f1

File tree

4 files changed

+9
-9
lines changed

4 files changed

+9
-9
lines changed

3rdparty/NeMo

Submodule NeMo updated from ee0be11 to f4f22a2

ci/benchmarks/partial-conv/evo2_pretrain.yaml

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,7 @@ script_args:
1616
workspace: /workspace/bionemo2
1717
data_path: /data/evo2
1818
artefacts_url: https://__token__:${JET_GITLAB_TOKEN}@gitlab-master.nvidia.com/api/v4/projects/180496/packages/pypi/simple
19-
file_name_wheel: cuhyena==v0.2.3+cuda12.9
19+
file_name_wheel: subquadratic-ops
2020
model: evo2
2121
variant: train
2222
config_name: 1b
@@ -55,7 +55,7 @@ script: |-
5555
--enable-preemption \
5656
--ckpt-async-save \
5757
--use-megatron-comm-overlap-llama3-8k \
58-
--use-b2b-causal-conv1d \
58+
--use-subquadratic_ops \
5959
--overlap-grad-reduce \
6060
--clip-grad=${clip_grad} \
6161
--eod-pad-in-loss-mask \
@@ -78,7 +78,7 @@ script: |-
7878
--limit-val-batches=20 \
7979
--log-every-n-steps=50 \
8080
--val-check-interval=500 \
81-
--use-b2b-causal-conv1d \
81+
--use-subquadratic_ops \
8282
--create-tflops-callback \
8383
--create-tensorboard-logger \
8484
--result-dir=${tensorboard_dir} \

ci/benchmarks/perf/evo2_pretrain.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -76,7 +76,7 @@ script: |-
7676
--limit-val-batches=20 \
7777
--log-every-n-steps=50 \
7878
--val-check-interval=200 \
79-
--use-b2b-causal-conv1d \
79+
--use-subquadratic_ops \
8080
--create-tflops-callback \
8181
--create-tensorboard-logger \
8282
--result-dir=${tensorboard_dir} \

sub-packages/bionemo-evo2/src/bionemo/evo2/run/train.py

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -462,9 +462,9 @@ def parse_args(args: Optional[List[str]] = None) -> argparse.Namespace:
462462
help="Dropout probability for the attention layers.",
463463
)
464464
parser.add_argument(
465-
"--use-b2b-causal-conv1d",
465+
"--use-subquadratic_ops",
466466
action="store_true",
467-
help="Use back-to-back causal convolution CUDA kernel for hyena short conv layers for improved performance.",
467+
help="Use subquadratic_ops for improved performance.",
468468
)
469469
parser.add_argument(
470470
"--save-top-k",
@@ -597,8 +597,8 @@ def train(args: argparse.Namespace) -> nl.Trainer:
597597
config_modifiers_init["ffn_hidden_size"] = args.ffn_hidden_size
598598
if args.use_targeted_variance_loss:
599599
config_modifiers_init["use_targeted_variance_loss"] = True
600-
if args.use_b2b_causal_conv1d:
601-
config_modifiers_init["use_b2b_causal_conv1d"] = True
600+
if args.use_subquadratic_ops:
601+
config_modifiers_init["use_subquadratic_ops"] = True
602602
if args.hybrid_override_pattern:
603603
config_modifiers_init["hybrid_override_pattern"] = args.hybrid_override_pattern
604604
if args.num_layers:

0 commit comments

Comments
 (0)