{
"run_id": "0903_libero_goal_augsteps_0_wo_flash_attention_wo_augsteps_two_view_action_chunk_16_pretrained_vlm",
"run_root_dir": "./playground/Checkpoints",
"seed": 42,
"trackers": [
"jsonl",
"wandb"
],
"wandb_entity": "michaelyu-1101-fudanuniversity",
"wandb_project": "Internvla",
"is_debug": false,
"framework": {
"framework_py": "DinoQFormerACT",
"qwenvl": {
"base_vlm": "/mnt/phwfile/efm_t/zhuyangkun_tmp_need_del/exp/exp_08_09/manip_sys2_qwen25_3b_onevision_molmo_a0all_refsp20/checkpoint-20000",
"attn_implementation": "flash_attention_2",
"vl_hidden_dim": 2048
},
"dino": {
"dino_backbone": "dinov2_vitl14"
},
"layer_qformer": {
"qformer_end_layer": 37,
"qformer_start_layer": 36,
"num_query_tokens": 64,
"grad_scale": 0.5
},
"action_model": {
"action_model_type": "DiT-B",
"action_hidden_dim": 768,
"action_dim": 7,
"use_ema": false,
"future_action_window_size": 7,
"past_action_window_size": 0,
"repeated_diffusion_steps": 8
},
"reduce_in_full_precision": true
},
"datasets": {
"vlm_data": {
"dataformat": "llava_json",
"dataset_use": "asv2_conversation_en,asv2_detailed_description_en,asv2_region_captioning_en,coco_internvl_longcap_en,coco_karpathy_train_567_en,coco_negative_gpt4o_en,coco_poetry_zh,coco_rem_en_zh,cocorem_exist_yorn_en,cocotextv2_en,cocotextv2_gpt4o_en,okvqa_en,refcoco_grounding_aug_en,refcoco_grounding_en,tallyqa_coco_en,toloka_grounding_aug_en,vqav2_en,vsr_en",
"eval_dataset": "aokvqa_cauldron_llava_format",
"data_flatten": false,
"base_interval": 2,
"max_pixels": 50176,
"min_pixels": 784,
"fix_image_size": [
224,
224
],
"model_max_length": 1024,
"model_type": "qwen2.5vl",
"per_device_batch_size": 4
},
"vla_data": {
"dataset_py": "lerobot_libero",
"data_root_dir": "playground/Datasets/LEROBOT_LIBERO_DATA",
"data_mix": "libero_goal",
"action_type": "delta_qpos",
"CoT_prompt": "Your task is {instruction}. To identify the key objects for your task. Locate their bounding boxes in [x1,y1,x2,y2] format.",
"CoT_answer": "bbox",
"default_image_resolution": [
3,
224,
224
],
"per_device_batch_size": 16,
"load_all_data_for_training": true,
"obs": [
"image_0"
]
}
},
"trainer": {
"epochs": 100,
"max_train_steps": 100000,
"num_warmup_steps": 5000,
"save_interval": 10000,
"eval_interval": 1000,
"learning_rate": {
"base": 2.5e-05
},
"lr_scheduler_type": "cosine_with_min_lr",
"scheduler_specific_kwargs": {
"min_lr": 1e-06
},
"freeze_modules": "",
"loss_scale": {
"vla": 1.0,
"vlm": 0.1
},
"max_grad_norm": 1.0,
"warmup_ratio": 0.1,
"weight_decay": 0.0,
"logging_frequency": 10,
"gradient_clipping": 1.0,
"gradient_accumulation_steps": 1,
"optimizer": {
"name": "AdamW",
"betas": [
0.9,
0.95
],
"eps": 1e-08,
"weight_decay": 1e-08
},
"is_resume": false,
"resume_epoch": null,
"resume_step": null,
"enable_gradient_checkpointing": true,
"enable_mixed_precision_training": true
},
"output_dir": "./playground/Checkpoints/0903_libero_goal_augsteps_0_wo_flash_attention_wo_augsteps_two_view_action_chunk_16_pretrained_vlm"
}