{
"dataset_param": {
"dataset_type": "multimodal",
"basic_parameters": {
"data_path": "/your_llava_data_path/LLaVA-Pretrain/blip_laion_cc_sbu_558k.json",
"data_folder": "/your_llava_data_path/LLaVA-Pretrain/images/"
},
"preprocess_parameters": {
"image_reader_type": "CLIPImageProcessor",
"train_pipeline": {
"crop_size": {"height": 336, "width": 336},
"do_center_crop": true,
"do_convert_rgb": true,
"do_normalize": true,
"do_rescale": true,
"do_resize": true,
"pad2square": false,
"image_mean": [0.48145466, 0.4578275, 0.40821073],
"image_std": [0.26862954, 0.26130258, 0.27577711],
"resample": 3,
"rescale_factor": 0.00392156862745098,
"size": {"shortest_edge": 336}
}
},
"tokenizer_config": {
"hub_backend": "hf",
"autotokenizer_name": "AutoTokenizer",
"from_pretrained": "/your_llava_weights_path/vicuna-7b-v1.5",
"cache_dir": null,
"padding_side": "right",
"use_fast": false
},
"use_text_processer": true,
"template_name": "llava-plain",
"mm_use_im_start_end": false
},
"dataloader_param": {
"dataloader_mode": "sampler",
"shuffle": true,
"drop_last": true,
"pin_memory": true,
"sampler_type": "BaseRandomBatchSampler",
"collate_param": {
"model_name": "llava",
"pad_token_id": 0
}
}
}