diff --git a/sagemaker/configs/qwen2-vl-7b-instruct.json b/sagemaker/configs/qwen2-vl-7b-instruct.json new file mode 100644 index 0000000000000..41695098edb63 --- /dev/null +++ b/sagemaker/configs/qwen2-vl-7b-instruct.json @@ -0,0 +1,10 @@ +{ + "model": "Qwen/Qwen2-VL-7B-Instruct", + "image": "vllm:0.6.1.post2-2", + "sagemaker_instance_type": "ml.g5.12xlarge", + "env_vars": { + "PIPELINE_PARALLEL_SIZE": "1", + "TENSOR_PARALLEL_SIZE": "4", + "DISABLE_CUSTOM_ALL_REDUCE": "true" + } +} \ No newline at end of file