File tree Expand file tree Collapse file tree
sub-packages/bionemo-evo2/src/bionemo/evo2/run Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -74,3 +74,28 @@ script: |-
7474 --disable-checkpointing \
7575 --early-stop-on-step=${stop_steps} \
7676 --create-tflops-callback;
77+ tests :
78+ - logic_type : static
79+ logic_spec :
80+ exit_codes :
81+ - 0
82+ baselines :
83+ consumed_samples :
84+ operator : eq
85+ value : 3072000.0
86+ val_loss :
87+ operator : range
88+ max : 0.6678
89+ min : 0.5630
90+ reduced_train_loss :
91+ operator : range
92+ max : 0.1372
93+ min : 0.0993
94+ TFLOPS_per_GPU :
95+ operator : range
96+ max : 719.5984
97+ min : 694.8020
98+ val_acc :
99+ operator : range
100+ max : 0.8462
101+ min : 0.7833
Original file line number Diff line number Diff line change @@ -16,7 +16,7 @@ script_args:
1616 workspace : /workspace/bionemo2
1717 data_path : /data/evo2
1818 artefacts_url : https://__token__:${JET_GITLAB_TOKEN}@gitlab-master.nvidia.com/api/v4/projects/180496/packages/pypi/simple
19- file_name_wheel : cuhyena==v0.2.3+cuda12.9
19+ file_name_wheel : subquadratic-ops
2020 model : evo2
2121 variant : train
2222 config_name : 1b
@@ -55,7 +55,7 @@ script: |-
5555 --enable-preemption \
5656 --ckpt-async-save \
5757 --use-megatron-comm-overlap-llama3-8k \
58- --use-b2b-causal-conv1d \
58+ --use-subquadratic_ops \
5959 --overlap-grad-reduce \
6060 --clip-grad=${clip_grad} \
6161 --eod-pad-in-loss-mask \
@@ -78,7 +78,7 @@ script: |-
7878 --limit-val-batches=20 \
7979 --log-every-n-steps=50 \
8080 --val-check-interval=500 \
81- --use-b2b-causal-conv1d \
81+ --use-subquadratic_ops \
8282 --create-tflops-callback \
8383 --create-tensorboard-logger \
8484 --result-dir=${tensorboard_dir} \
Original file line number Diff line number Diff line change @@ -76,7 +76,7 @@ script: |-
7676 --limit-val-batches=20 \
7777 --log-every-n-steps=50 \
7878 --val-check-interval=200 \
79- --use-b2b-causal-conv1d \
79+ --use-subquadratic_ops \
8080 --create-tflops-callback \
8181 --create-tensorboard-logger \
8282 --result-dir=${tensorboard_dir} \
Original file line number Diff line number Diff line change @@ -462,9 +462,9 @@ def parse_args(args: Optional[List[str]] = None) -> argparse.Namespace:
462462 help = "Dropout probability for the attention layers." ,
463463 )
464464 parser .add_argument (
465- "--use-b2b-causal-conv1d " ,
465+ "--use-subquadratic_ops " ,
466466 action = "store_true" ,
467- help = "Use back-to-back causal convolution CUDA kernel for hyena short conv layers for improved performance." ,
467+ help = "Use subquadratic_ops for improved performance." ,
468468 )
469469 parser .add_argument (
470470 "--save-top-k" ,
@@ -597,8 +597,8 @@ def train(args: argparse.Namespace) -> nl.Trainer:
597597 config_modifiers_init ["ffn_hidden_size" ] = args .ffn_hidden_size
598598 if args .use_targeted_variance_loss :
599599 config_modifiers_init ["use_targeted_variance_loss" ] = True
600- if args .use_b2b_causal_conv1d :
601- config_modifiers_init ["use_b2b_causal_conv1d " ] = True
600+ if args .use_subquadratic_ops :
601+ config_modifiers_init ["use_subquadratic_ops " ] = True
602602 if args .hybrid_override_pattern :
603603 config_modifiers_init ["hybrid_override_pattern" ] = args .hybrid_override_pattern
604604 if args .num_layers :
You can’t perform that action at this time.
0 commit comments