File tree Expand file tree Collapse file tree
recipes/codonfm_native_te Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -156,6 +156,12 @@ def __init__(
156156 "num_attention_heads" : 32 ,
157157 "num_hidden_layers" : 24 ,
158158 },
159+ "encodon_10b" : {
160+ "hidden_size" : 5120 ,
161+ "intermediate_size" : 20480 ,
162+ "num_attention_heads" : 40 ,
163+ "num_hidden_layers" : 34 ,
164+ },
159165}
160166
161167
# Hydra config for pre-training the `encodon_10b` model preset.
# Values not set here are inherited from the base `defaults` config;
# `_self_` is listed last so the keys in this file override the inherited ones.
defaults:
  - defaults
  - _self_

# Training config
model_preset: encodon_10b
num_train_steps: 500_000

precision: bf16-mixed

use_sequence_packing: true
dataset:
  data_path: ???  # mandatory: must be supplied by the caller (e.g. on the command line)
  micro_batch_size: 4
  num_workers: 1
  max_seq_length: 2048

# WandB config
wandb_init_args:
  name: "codonfm_native_te_10b"

# Learning rate scheduler config
lr_scheduler_kwargs:
  num_warmup_steps: 2_000
  # Follow the top-level step count so that overriding `num_train_steps`
  # cannot leave the LR schedule out of sync with the actual run length.
  num_training_steps: ${num_train_steps}

checkpoint:
  ckpt_dir: ???  # mandatory: must be supplied by the caller
  resume_from_checkpoint: true
  save_every_n_steps: 1_000

logger:
  frequency: 100
Original file line number Diff line number Diff line change @@ -162,6 +162,12 @@ def __init__(
162162 "num_attention_heads" : 32 ,
163163 "num_hidden_layers" : 24 ,
164164 },
165+ "encodon_10b" : {
166+ "hidden_size" : 5120 ,
167+ "intermediate_size" : 20480 ,
168+ "num_attention_heads" : 40 ,
169+ "num_hidden_layers" : 34 ,
170+ },
165171}
166172
167173
You can’t perform that action at this time.
0 commit comments