Skip to content

Commit 347bcfa

Browse files
committed
Update default.yaml
1 parent 24d8d16 commit 347bcfa

1 file changed

Lines changed: 4 additions & 4 deletions

File tree

example_yamls/default.yaml

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -20,11 +20,11 @@ vocab_size: 33
2020
expansion_ratio: 2.6667 # 8/3
2121
soft_logit_cap: 32.0
2222
attention_soft_cap: 64.0
23-
add_att_soft_cap: true
23+
add_att_soft_cap: false
2424
p_attention: false
2525
tie_embeddings: false
2626
unet: true
27-
token_dropout: true
27+
token_dropout: false
2828

2929
# Data Configuration
3030
input_bin: "data/omgprot50/omgprot50_train_*.bin"
@@ -38,7 +38,7 @@ mask_rate_steps: 2500
3838

3939
# Training Hyperparameters
4040
batch_size: 524288 # 8*64*1024 tokens
41-
grad_accum: 1
41+
grad_accum: 8
4242
num_steps: 50000
4343
cooldown_steps: 5000
4444
max_length: 1024
@@ -52,7 +52,7 @@ lr_embed: 0.06
5252
lr_head: 0.008
5353
lr_scalar: 0.04
5454
grad_clip: 0.0
55-
auto_grad_clip: true
55+
auto_grad_clip: false
5656
auto_grad_clip_percentile: 10
5757

5858
# Muon optimizer (for hidden layers)

0 commit comments

Comments
 (0)