---
# Training run configuration, grouped into io / loader / model / context /
# optimizer sections followed by run-level settings.
# NOTE(review): section membership is inferred from the section headers and
# the blank-line grouping of the keys; confirm against the code that loads
# this file.

# Output location, evaluation/logging cadence and checkpoint/resume flags.
io:
  out_dir: "debug"
  eval_interval: 10
  log_interval: 10
  eval_iters: 5
  eval_only: false
  always_save_checkpoint: true
  init_from: "scratch"
  resume_when_snapshot_available: false

# Batching and dataset selection.
loader:
  batch_size: 4
  max_seq_len: 768
  dataset: "smiles"
  processed_dataset_ckpt: "processed_dataset_500000.pkl"
  fragment_creator: "rss"

# Model size hyperparameters (deliberately tiny values).
model:
  dim: 32
  n_layers: 1
  n_heads: 1
  multiple_of: 16
  dropout: 0.1

# Conditioning inputs.
# NOTE(review): context_dims presumably lines up index-by-index with
# context_keys (both have three entries) -- verify against the consumer.
context:
  context_keys: ["logp", "sascore", "mol_weight"]
  context_dims: [1, 1, 1]

optimizer:
  gradient_accumulation_steps: 4
  # Written with an explicit mantissa decimal point: a bare `1e-4` is read
  # as a string (not a float) by YAML 1.1 loaders such as PyYAML.
  learning_rate: 1.0e-4
  max_iters: 20
  weight_decay: 1.0e-1
  beta1: 0.9
  beta2: 0.95
  grad_clip: 1.0

  # Learning-rate schedule.
  # NOTE(review): assumed to belong to the optimizer section -- confirm.
  decay_lr: true
  warmup_iters: 10
  lr_decay_iters: 100
  min_lr: 0.0

# Run-level settings.
# NOTE(review): assumed to be top-level keys rather than optimizer
# children -- confirm against the config schema.
dtype: "float16"
compile: false
label: "llama2-Debug"
profile: false