diff --git a/lmdeploy/serve/turbomind/deploy.py b/lmdeploy/serve/turbomind/deploy.py index cc8db88f5..3aca6e1f1 100644 --- a/lmdeploy/serve/turbomind/deploy.py +++ b/lmdeploy/serve/turbomind/deploy.py @@ -984,7 +984,7 @@ def main(model_name: str, assert ((tp & (tp - 1) == 0) and tp != 0), 'tp should be 2^n' if model_format is None: - model_format = 'qwen' if model_name == 'qwen-7b' else 'hf' + model_format = 'qwen' if model_name.startswith('qwen') else 'hf' if model_format not in supported_formats: print(f'the model format "{model_format}" is not supported. '