stackvlm-2000 / train_config.json
patrickamadeus's picture
Upload step 2000 checkpoint
d28832c verified
{
"lr_mp": 5e-05,
"lr_vision_backbone": 0.0,
"lr_language_backbone": 5e-05,
"lr_full_decoder": 0.0,
"batch_size": 16,
"gradient_accumulation_steps": 8,
"max_grad_norm": 1.0,
"max_training_steps": 5000,
"stop_after_step": 5000,
"warmup_ratio": 0.03,
"stats_log_interval": 100,
"precision": "bf16",
"compile": false,
"log_train_samples": false,
"do_eval": true,
"eval_interval": 500,
"max_val_batches": 32,
"max_images_per_example": 1,
"max_sample_length": 6144,
"train_dataset_path": "patrickamadeus/the_cauldron",
"train_dataset_name": [
"all"
],
"train_split": "train",
"val_split": "validation",
"stream_dataset": true,
"dataloader_num_workers": 2,
"dataloader_pin_memory": true,
"enable_source_filter": true,
"allowed_dataset_sources": [
"dvqa",
"tallyqa",
"figureqa",
"ocrvqa",
"vqav2",
"clevr",
"cocoqa",
"textvqa",
"visual7w",
"st_vqa",
"docvqa",
"aokvqa",
"chartqa"
],
"relevance_min_rating": 1,
"image_correspondence_min_rating": 1,
"visual_dependency_min_rating": 1,
"formatting_min_rating": 1,
"wandb_entity": "HuggingFace",
"log_wandb": false,
"push_checkpoints_to_hub": true,
"save_training_state_to_hub": true,
"checkpoint_repo_pattern": "patrickamadeus/stackvlm-{i}",
"hf_private": false,
"push_final_model_to_hub": false,
"resume_from_vlm_checkpoint": false,
"resume_checkpoint_path": "patrickamadeus/stackvlm-1500",
"resume_start_step": 1500
}