Skip to content
Snippets Groups Projects
Commit 0fcbfb1f authored by Johann-Ludwig Herzog
Browse files

added script for dummy training of LLaVA with vit-s and BEN data

parent 0f6536da
No related branches found
No related tags found
Loading
#!/bin/bash
#
# Dummy pretraining run of LLaVA with a ViT-S vision tower on BEN data.
#
# Starts llava/train/train_mem.py through the `deepspeed` launcher with a
# fixed set of training flags. Every relative path below is resolved against
# the current working directory.
# NOTE(review): presumably meant to be run from the repository root - confirm.
#
# Optional environment overrides (each default is the previously hard-coded
# value, so running with none of them set passes exactly the same arguments
# as before):
#   LLAVA_MODEL_PATH        value for --model_name_or_path
#   LLAVA_VISION_TOWER      value for --vision_tower
#   LLAVA_OUTPUT_DIR        value for --output_dir
#   BEN_LMDB_PATH           value for --ben_lmdb_path
#   BEN_META_PARQUET        value for --ben_meta_parquet
#   BEN_SNOW_CLOUD_PARQUET  value for --ben_snow_cloud_parquet
#
# Exit status: that of the deepspeed command.

set -euo pipefail

# Machine-specific locations; an unset or empty variable falls back to the
# original hard-coded path.
readonly model_path="${LLAVA_MODEL_PATH:-../../../mnt/storagecube/johann/llava-v1.5-vit-s}"
readonly vision_tower="${LLAVA_VISION_TOWER:-./clip-S-224-16-zavras/}"
readonly output_dir="${LLAVA_OUTPUT_DIR:-../../../mnt/storagecube/johann/checkpoints/llava-v1.5-7b-vit-s-pretrain-dummy}"
readonly ben_lmdb_path="${BEN_LMDB_PATH:-../../../data/kaiclasen/BENv2.lmdb}"
readonly ben_meta_parquet="${BEN_META_PARQUET:-../../../data/kaiclasen/metadata.parquet}"
readonly ben_snow_cloud_parquet="${BEN_SNOW_CLOUD_PARQUET:-../../../data/kaiclasen/metadata_for_patches_with_snow_cloud_or_shadow.parquet}"

# Arguments are collected in an array so that every value stays a single word
# even if an overridden path contains whitespace.
train_args=(
  --deepspeed ./scripts/zero2.json

  # Model, data and vision tower.
  --model_name_or_path "${model_path}"
  --version plain
  --data_path ./BEN_10.json
  --image_folder ./playground
  --vision_tower "${vision_tower}"
  --mm_projector_type linear
  --tune_mm_mlp_adapter True
  --mm_vision_select_layer -2
  --mm_use_im_start_end False
  --mm_use_im_patch_token False

  # Precision and output location.
  --bf16 True
  --output_dir "${output_dir}"

  # Schedule, batching, evaluation and checkpointing.
  --num_train_epochs 5
  --per_device_train_batch_size 2
  --per_device_eval_batch_size 4
  --gradient_accumulation_steps 1
  --evaluation_strategy "no"
  --save_strategy "no"
  # NOTE(review): the two save_* flags below presumably have no effect while
  # --save_strategy is "no" - confirm against the trainer's documentation.
  --save_steps 24000
  --save_total_limit 1

  # Optimizer and learning-rate schedule.
  --learning_rate 1e-3
  --weight_decay 0.
  --warmup_ratio 0.03
  --lr_scheduler_type "cosine"

  # Logging and runtime settings.
  --logging_steps 1
  --tf32 True
  --model_max_length 2048
  --gradient_checkpointing True
  --dataloader_num_workers 4
  --lazy_preprocess True
  --report_to wandb
  --bits 8

  # BEN dataset inputs.
  --ben_lmdb_path "${ben_lmdb_path}"
  --ben_meta_parquet "${ben_meta_parquet}"
  --ben_snow_cloud_parquet "${ben_snow_cloud_parquet}"
  --ben_image_size 224
  --ben_channels 14
)

deepspeed llava/train/train_mem.py "${train_args[@]}"
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment