Add a workaround for saving internvl2 with latest transformers (#2583)
* Add a workaround for saving internvl2 with latest transformers

* fix lint

* use arch
AllentDan authored Oct 17, 2024
1 parent b689cbc commit fec94c9
Showing 1 changed file with 19 additions and 0 deletions.
lmdeploy/lite/apis/calibrate.py: 19 additions & 0 deletions

@@ -132,6 +132,24 @@ class name or the class type itself.
             print(f'Move {mod_name} to GPU.')
 
 
+# TODO to be removed
+def make_compatible_internvl_config(model_path):
+    """Patch model.config since after transformers v4.45.0, InternVL models
+    can't use `save_pretrained`"""
+    from lmdeploy.archs import get_model_arch
+    arch, _ = get_model_arch(model_path)
+    if arch == 'InternVLChatModel':
+        import transformers
+        from packaging import version
+        if version.parse(transformers.__version__) >= version.parse('4.45.0'):
+
+            def _get_non_default_generation_parameters(self):
+                return {}
+
+            from transformers import PretrainedConfig
+            PretrainedConfig._get_non_default_generation_parameters = _get_non_default_generation_parameters  # noqa
+
+
 def calibrate(model: str,
               calib_dataset: str = 'ptb',
               calib_samples: int = 128,
@@ -175,6 +193,7 @@ def calibrate(model: str,
         'Support only `c4`, `ptb`, `wikitext2` or `pileval`.'
 
     model_type, _ = get_task(model)
+    make_compatible_internvl_config(model)
     if model_type == 'llm':
         # Load tokenizer and configuration
         tokenizer = AutoTokenizer.from_pretrained(model,
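How the workaround operates: it monkey-patches `PretrainedConfig._get_non_default_generation_parameters` to return an empty dict, so the config no longer reports non-default generation parameters, which (per the docstring) is what makes `save_pretrained` fail for InternVL checkpoints on transformers v4.45.0 and later. A minimal standalone sketch of the same patch follows; it assumes transformers >= 4.45.0 is installed, and `MODEL_PATH` plus the output directory are hypothetical stand-ins, not names taken from the commit:

    # Hedged sketch of the commit's monkey-patch, applied outside lmdeploy.
    import transformers
    from packaging import version
    from transformers import AutoModel, PretrainedConfig

    MODEL_PATH = './InternVL2-8B'  # hypothetical local checkpoint path

    if version.parse(transformers.__version__) >= version.parse('4.45.0'):

        def _get_non_default_generation_parameters(self):
            # Report no non-default generation parameters, so saving the
            # config is not rejected on transformers >= 4.45.0.
            return {}

        PretrainedConfig._get_non_default_generation_parameters = \
            _get_non_default_generation_parameters

    model = AutoModel.from_pretrained(MODEL_PATH, trust_remote_code=True)
    model.save_pretrained('./internvl2-saved')  # hypothetical output dir

Within lmdeploy itself no user action is needed: `calibrate` calls `make_compatible_internvl_config(model)` immediately after `get_task`, so the patch takes effect for any calibration run before the model is loaded and later saved.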
