oumi-ai · xrdaukar · Jan 29, 2025 · Jan 29, 2025 · Jan 29, 2025
diff --git a/configs/recipes/vision/qwen2_vl_2b/sft/train.yaml b/configs/recipes/vision/qwen2_vl_2b/sft/train.yaml
@@ -23,7 +23,7 @@ data:
         transform_num_workers: "auto"
         dataset_kwargs:
           processor_name: "Qwen/Qwen2-VL-2B-Instruct"
-          limit: 4096
+          # limit: 4096  # Uncomment to limit the dataset size.
           return_tensors: True
       # - dataset_name: "HuggingFaceH4/llava-instruct-mix-vsft"
       #   split: "train"
@@ -32,7 +32,6 @@ data:
       #   transform_num_workers: "auto"
       #   dataset_kwargs:
       #     processor_name: "Qwen/Qwen2-VL-2B-Instruct"
-      #     limit: 8192
       #     return_tensors: True
 
 training:

diff --git a/configs/recipes/vision/smolvlm/sft/gcp_job.yaml b/configs/recipes/vision/smolvlm/sft/gcp_job.yaml
@@ -35,7 +35,7 @@ setup: |
   pip install uv && uv pip install '.[gpu]' hf_transfer
   # Install model from HF Hub. This tool increases download speed compared to
   # downloading the model during training.
-  HF_HUB_ENABLE_HF_TRANSFER=1 huggingface-cli download HuggingFaceTB/SmolVLM-Instruct
+  HF_HUB_ENABLE_HF_TRANSFER=1 huggingface-cli download HuggingFaceTB/SmolVLM-Instruct --exclude "onnx/*" "runs/*"
 
   pip install -U "transformers>=4.46,<4.47"
   pip install -U flash-attn --no-build-isolation

diff --git a/configs/recipes/vision/smolvlm/sft/train.yaml b/configs/recipes/vision/smolvlm/sft/train.yaml
@@ -24,7 +24,7 @@ data:
         transform_num_workers: "auto"
         dataset_kwargs:
           processor_name: "HuggingFaceTB/SmolVLM-Instruct"
-          limit: 4096
+          # limit: 4096  # Uncomment to limit the dataset size.
           return_tensors: True
 
 training: