diff --git a/sagemaker/configs/llama3-70b.json b/sagemaker/configs/llama3_1-70b.json similarity index 72% rename from sagemaker/configs/llama3-70b.json rename to sagemaker/configs/llama3_1-70b.json index 440fae416f0aa..2a7e86fa079b9 100644 --- a/sagemaker/configs/llama3-70b.json +++ b/sagemaker/configs/llama3_1-70b.json @@ -4,6 +4,7 @@ "sagemaker_instance_type": "ml.p4d.24xlarge", "env_vars": { "TENSOR_PARALLEL_SIZE": "8", - "DISABLE_CUSTOM_ALL_REDUCE": "true" + "DISABLE_CUSTOM_ALL_REDUCE": "true", + "MAX_MODEL_LEN": "32768" } } \ No newline at end of file diff --git a/sagemaker/configs/llama3-8b.json b/sagemaker/configs/llama3_1-8b.json similarity index 72% rename from sagemaker/configs/llama3-8b.json rename to sagemaker/configs/llama3_1-8b.json index 7f28d7f7708bf..076da16988a49 100644 --- a/sagemaker/configs/llama3-8b.json +++ b/sagemaker/configs/llama3_1-8b.json @@ -4,6 +4,7 @@ "sagemaker_instance_type": "ml.g5.2xlarge", "env_vars": { "TENSOR_PARALLEL_SIZE": "1", - "DISABLE_CUSTOM_ALL_REDUCE": "true" + "DISABLE_CUSTOM_ALL_REDUCE": "true", + "MAX_MODEL_LEN": "32768" } } \ No newline at end of file