---
# Training run configuration.
#
# Layout: one key per line (block mapping). Several `key: value` pairs on a
# single line are not valid YAML, because a plain scalar cannot contain ": ".
# Key names, values and key order are unchanged; only the layout and the
# comments are new.
# NOTE(review): the section comments below are inferred from the key names
# only; confirm the exact semantics against the script that loads this file.

# Experiment tracking
wandb_project: joy-caption-1

# Batch sizes
# NOTE(review): batch_size / device_batch_size = 128; presumably the ratio is
# covered by gradient accumulation and/or multiple devices -- confirm.
device_batch_size: 2
batch_size: 256

# Schedule lengths and checkpoint/test cadence
# NOTE(review): the `*_samples` names suggest these are counted in samples
# rather than optimizer steps; the unit of `*_every` is not visible here.
learning_rate: 0.001
warmup_samples: 18000
max_samples: 600000
save_every: 50000
test_every: 50000

# Numerics / precision
use_amp: true
grad_scaler: true

# Learning-rate schedule
lr_scheduler_type: cosine
min_lr_ratio: 0.0

allow_tf32: true

# Reproducibility and data loading
seed: 42
num_workers: 8

# Optimizer
optimizer_type: adamw
adam_beta1: 0.9
adam_beta2: 0.999
# Written with a decimal point and a signed exponent so that YAML 1.1 parsers
# also resolve it to a float instead of a string.
adam_eps: 1.0e-08
adam_weight_decay: 0.0
clip_grad_norm: 1.0

# Dataset and model identifiers
# NOTE(review): these look like Hugging Face Hub repository ids -- confirm.
dataset: fancyfeast/joy-captioning-20240729a
clip_model: google/siglip-so400m-patch14-384
text_model: meta-llama/Meta-Llama-3.1-8B

# Explicit null (not an empty value).
# NOTE(review): presumably "do not resume from a checkpoint" -- confirm.
resume: null
gradient_checkpointing: false

test_size: 2048
grad_scaler_init: 65536.0

# Sequence / adapter settings
max_caption_length: 257
num_image_tokens: 32
adapter_type: mlp
text_model_dtype: float16