Commit d871453 (1 parent: 7d46c8d)
1 file changed: +7 -0 lines changed
Columns: original file line number | diff line number | diff line change
@@ -29,6 +29,7 @@ def main(args: argparse.Namespace):
29
29
tensor_parallel_size = args .tensor_parallel_size ,
30
30
trust_remote_code = args .trust_remote_code ,
31
31
dtype = args .dtype ,
32
+ max_model_len = args .max_model_len ,
32
33
enforce_eager = args .enforce_eager ,
33
34
kv_cache_dtype = args .kv_cache_dtype ,
34
35
quantization_param_path = args .quantization_param_path ,
@@ -150,6 +151,12 @@ def run_to_completion(profile_dir: Optional[str] = None):
150
151
parser .add_argument ('--trust-remote-code' ,
151
152
action = 'store_true' ,
152
153
help = 'trust remote code from huggingface' )
154
+ parser .add_argument (
155
+ '--max-model-len' ,
156
+ type = int ,
157
+ default = None ,
158
+ help = 'Maximum length of a sequence (including prompt and output). '
159
+ 'If None, will be derived from the model.' )
153
160
parser .add_argument (
154
161
'--dtype' ,
155
162
type = str ,
You can’t perform that action at this time.
0 commit comments