Skip to content

Commit

Permalink
update LLaVA-Next training scripts based on mlcd-vit-bigG-patch14-448
Browse files Browse the repository at this point in the history
  • Loading branch information
yiyexy committed Feb 14, 2025
1 parent 68a13e7 commit 26bc472
Show file tree
Hide file tree
Showing 2 changed files with 3 additions and 3 deletions.
4 changes: 2 additions & 2 deletions scripts/finetune_mlcd.sh
Original file line number Diff line number Diff line change
Expand Up @@ -12,7 +12,7 @@ export PYTHONPATH=$(pwd)

LLM_VERSION="Qwen/Qwen2.5-7B-Instruct"
LLM_VERSION_CLEAN="${LLM_VERSION//\//_}"
- VISION_MODEL_VERSION="DeepGlint-AI/mlcd-vit-large-patch14-336"
+ VISION_MODEL_VERSION="DeepGlint-AI/mlcd-vit-bigG-patch14-448"
VISION_MODEL_VERSION_CLEAN="${VISION_MODEL_VERSION//\//_}"
DATA_ROOT="/vlm/data/train_images"
PROJECTOR_NAME="pretrained_projector name"
Expand Down Expand Up @@ -40,7 +40,7 @@ ACCELERATE_CPU_AFFINITY=1 torchrun --nproc_per_node="${NUM_GPUS}" --nnodes="${NN
--mm_use_im_patch_token False \
--group_by_modality_length True \
--image_aspect_ratio anyres \
- --image_grid_pinpoints "[(336, 672), (672, 336), (672, 672), (1008, 336), (336, 1008)]" \
+ --image_grid_pinpoints "[(448, 896), (896, 448), (896, 896), (1344, 448), (448, 1344)]" \
--mm_patch_merge_type spatial_unpad \
--bf16 True \
--run_name $BASE_RUN_NAME \
Expand Down
2 changes: 1 addition & 1 deletion scripts/pretrain_mlcd.sh
Original file line number Diff line number Diff line change
Expand Up @@ -12,7 +12,7 @@ export PYTHONPATH=$(pwd)

LLM_VERSION="Qwen/Qwen2.5-7B-Instruct"
LLM_VERSION_CLEAN="${LLM_VERSION//\//_}"
- VISION_MODEL_VERSION="DeepGlint-AI/mlcd-vit-large-patch14-336"
+ VISION_MODEL_VERSION="DeepGlint-AI/mlcd-vit-bigG-patch14-448"
VISION_MODEL_VERSION_CLEAN="${VISION_MODEL_VERSION//\//_}"
DATA_ROOT="llava 558k data root"

Expand Down

0 comments on commit 26bc472

Please sign in to comment.