# Mirror of https://github.com/leigest519/ScreenCoder.git
# Synced 2026-02-13 10:12:46 +00:00 (viewer metadata: 22 lines, 647 B, YAML)
# Training run configuration: Qwen2.5-VL-3B-Instruct on the Idefics ai2d data.
# NOTE(review): the key names look like Hugging Face TrainingArguments plus
# TRL GRPO-style options (num_generations, max_prompt_length) — confirm
# against the script that loads this file.

# --- Paths -------------------------------------------------------------------
# Every /path/to/... value is a placeholder and must be replaced before use.
output_dir: /path/to/output/runs/Qwen2.5-VL-3B-Idefics-V3-RSN-ai2d-500steps
model_name_or_path: /path/to/models/Qwen2.5-VL-3B-Instruct

# --- Dataset -----------------------------------------------------------------
dataset_name: Idefics-ai2d
data_file_paths: /path/to/data/ai2d.jsonl
image_folders: /path/to/images

# --- Prompt / batching -------------------------------------------------------
max_prompt_length: 1024
per_device_train_batch_size: 1
gradient_accumulation_steps: 2

# --- Logging / precision -----------------------------------------------------
logging_steps: 1
bf16: true
report_to: wandb

# --- Memory / distributed setup ----------------------------------------------
gradient_checkpointing: false
# The file name suggests a DeepSpeed ZeRO stage-3 config — TODO confirm.
deepspeed: /path/to/config/zero3.json
attn_implementation: flash_attention_2

# --- Vision input ------------------------------------------------------------
# 401408 = 512 * 28 * 28.
# NOTE(review): presumably an image budget of 512 patches of 28x28 px — confirm.
max_pixels: 401408

# --- Schedule ----------------------------------------------------------------
# Matches the "500steps" suffix used in output_dir and run_name.
max_steps: 500
# NOTE(review): run_name carries a "-multinode" suffix that output_dir does
# not — confirm this difference is intentional.
run_name: Qwen2.5-VL-3B-Idefics-V3-RSN-ai2d-500steps-multinode

# --- Checkpointing -----------------------------------------------------------
save_steps: 100
save_total_limit: 3
save_only_model: true

# --- Generation --------------------------------------------------------------
# NOTE(review): presumably the number of completions sampled per prompt;
# check any divisibility constraint against the effective batch size.
num_generations: 8