From 3cb5a73d3789fd5712e017e1b1074d6704ae1fb0 Mon Sep 17 00:00:00 2001
From: Naman Nandan
Date: Tue, 26 Sep 2023 16:32:16 -0700
Subject: [PATCH] Update path to sample input text for inf2 opt benchmark model (#2617)

* update path to sample input text for inf2 opt benchmark model

* test inf2 benchmark fix

* Revert "test inf2 benchmark fix"

This reverts commit 467930598607c9a05831c0cb3d40721bee98cf4e.

---------

Co-authored-by: Naman Nandan
---
 benchmarks/models_config/opt_6.7b_neuronx.yaml | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/benchmarks/models_config/opt_6.7b_neuronx.yaml b/benchmarks/models_config/opt_6.7b_neuronx.yaml
index 99df9cc78b..1dc0f0e63f 100644
--- a/benchmarks/models_config/opt_6.7b_neuronx.yaml
+++ b/benchmarks/models_config/opt_6.7b_neuronx.yaml
@@ -8,7 +8,7 @@ opt_6.7b_neuronx_batch_1:
         batch_delay: 100
         batch_size:
             - 1
-        input: "./examples/large_models/inferentia2/sample_text.txt"
+        input: "./examples/large_models/inferentia2/opt/sample_text.txt"
         requests: 2000
         concurrency: 10
         backend_profiling: False
@@ -25,7 +25,7 @@ opt_6.7b_neuronx_batch_2:
         batch_delay: 100
         batch_size:
             - 2
-        input: "./examples/large_models/inferentia2/sample_text.txt"
+        input: "./examples/large_models/inferentia2/opt/sample_text.txt"
         requests: 2000
         concurrency: 10
         backend_profiling: False
@@ -42,7 +42,7 @@ opt_6.7b_neuronx_batch_4:
         batch_delay: 100
         batch_size:
             - 4
-        input: "./examples/large_models/inferentia2/sample_text.txt"
+        input: "./examples/large_models/inferentia2/opt/sample_text.txt"
         requests: 2000
         concurrency: 10
         backend_profiling: False
@@ -59,7 +59,7 @@ opt_6.7b_neuronx_batch_8:
         batch_delay: 100
         batch_size:
             - 8
-        input: "./examples/large_models/inferentia2/sample_text.txt"
+        input: "./examples/large_models/inferentia2/opt/sample_text.txt"
         requests: 2000
         concurrency: 10
         backend_profiling: False