feat(model): Support gemma model (#1187)

eosphoros-ai · Feb 23, 2024 · f9d9f8f · f9d9f8f
1 parent e098619
commit f9d9f8f
Show file tree

Hide file tree

Showing 4 changed files with 56 additions and 3 deletions.
diff --git a/README.md b/README.md
@@ -142,6 +142,8 @@ At present, we have introduced several key features to showcase our current capa
   We offer extensive model support, including dozens of large language models (LLMs), both open-source models and API proxies, such as LLaMA/LLaMA2, Baichuan, ChatGLM, Wenxin, Tongyi, Zhipu, and many more.
 
   - News
+    - 🔥🔥🔥  [gemma-7b-it](https://huggingface.co/google/gemma-7b-it)
+    - 🔥🔥🔥  [gemma-2b-it](https://huggingface.co/google/gemma-2b-it)
     - 🔥🔥🔥  [SOLAR-10.7B](https://huggingface.co/upstage/SOLAR-10.7B-Instruct-v1.0)
     - 🔥🔥🔥  [Mixtral-8x7B](https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1)
     - 🔥🔥🔥  [Qwen-72B-Chat](https://huggingface.co/Qwen/Qwen-72B-Chat)

diff --git a/README.zh.md b/README.zh.md
@@ -139,6 +139,8 @@ DB-GPT是一个开源的AI原生数据应用开发框架(AI Native Data App Deve
   海量模型支持，包括开源、API代理等几十种大语言模型。如LLaMA/LLaMA2、Baichuan、ChatGLM、文心、通义、智谱等。当前已支持如下模型: 
 
   - 新增支持模型
+    - 🔥🔥🔥  [gemma-7b-it](https://huggingface.co/google/gemma-7b-it)
+    - 🔥🔥🔥  [gemma-2b-it](https://huggingface.co/google/gemma-2b-it)
     - 🔥🔥🔥  [SOLAR-10.7B](https://huggingface.co/upstage/SOLAR-10.7B-Instruct-v1.0)
     - 🔥🔥🔥  [Mixtral-8x7B](https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1)
     - 🔥🔥🔥  [Qwen-72B-Chat](https://huggingface.co/Qwen/Qwen-72B-Chat)

diff --git a/dbgpt/configs/model_config.py b/dbgpt/configs/model_config.py
@@ -148,6 +148,10 @@ def get_device() -> str:
     # https://huggingface.co/01-ai/Yi-34B-Chat-4bits
     "yi-34b-chat-4bits": os.path.join(MODEL_PATH, "Yi-34B-Chat-4bits"),
     "yi-6b-chat": os.path.join(MODEL_PATH, "Yi-6B-Chat"),
+    # https://huggingface.co/google/gemma-7b-it
+    "gemma-7b-it": os.path.join(MODEL_PATH, "gemma-7b-it"),
+    # https://huggingface.co/google/gemma-2b-it
+    "gemma-2b-it": os.path.join(MODEL_PATH, "gemma-2b-it"),
 }
 
 EMBEDDING_MODEL_CONFIG = {

diff --git a/dbgpt/model/adapter/hf_adapter.py b/dbgpt/model/adapter/hf_adapter.py
@@ -39,19 +39,38 @@ def match(
     def do_match(self, lower_model_name_or_path: Optional[str] = None):
         """Decide whether this adapter handles the given model.
 
         This base implementation is a placeholder that always raises;
         concrete adapters are expected to override it.
 
         Args:
             lower_model_name_or_path: Model name or path to test; presumably
                 already lower-cased by the caller (TODO confirm).
 
         Raises:
             NotImplementedError: Always.
         """
         raise NotImplementedError()
 
-    def load(self, model_path: str, from_pretrained_kwargs: dict):
+    def check_dependencies(self) -> None:
+        """Verify that transformers is importable and recent enough.
+
+        Imports ``transformers`` and hands ``transformers.__version__`` to
+        ``check_transformer_version``, so an adapter can change the minimum
+        release by overriding that method.
+
+        Raises:
+            ValueError: If ``transformers`` cannot be imported, or if
+                ``check_transformer_version`` rejects the installed version.
+        """
         try:
             import transformers
-            from transformers import AutoModel, AutoModelForCausalLM, AutoTokenizer
         except ImportError as exc:
             raise ValueError(
                 "Could not import depend python package "
                 "Please install it with `pip install transformers`."
             ) from exc
-        if not transformers.__version__ >= "4.34.0":
+        self.check_transformer_version(transformers.__version__)
+
+    def check_transformer_version(self, current_version: str) -> None:
+        """Ensure the given transformers version is at least 4.34.0.
+
+        The version is compared numerically, component by component. A plain
+        string comparison would rank "4.4.0" above "4.34.0" and "4.100.0"
+        below it, accepting too-old releases and rejecting newer ones.
+
+        Args:
+            current_version: Version string to check, e.g. the value of
+                ``transformers.__version__``.
+
+        Raises:
+            ValueError: If the version is older than 4.34.0 or does not start
+                with a numeric release segment.
+        """
+        import re
+
+        # Keep only the leading numeric release ("4.38.0.dev0" -> "4.38.0").
+        release = re.match(r"\d+(?:\.\d+)*", current_version.strip())
+        parts = tuple(int(p) for p in release.group().split(".")) if release else ()
+        # Pad short versions so that "4.34" compares equal to "4.34.0".
+        parts += (0,) * (3 - len(parts))
+        if parts < (4, 34, 0):
+            raise ValueError(
+                "Current model (Load by NewHFChatModelAdapter) require transformers.__version__>=4.34.0"
+            )
+
+    def load(self, model_path: str, from_pretrained_kwargs: dict):
+        try:
+            import transformers
+            from transformers import AutoModel, AutoModelForCausalLM, AutoTokenizer
+        except ImportError as exc:
+            raise ValueError(
+                "Could not import depend python package "
+                "Please install it with `pip install transformers`."
+            ) from exc
+        self.check_dependencies()
+
         revision = from_pretrained_kwargs.get("revision", "main")
         try:
             tokenizer = AutoTokenizer.from_pretrained(
@@ -149,6 +168,32 @@ def do_match(self, lower_model_name_or_path: Optional[str] = None):
         )
 
 
+class GemmaAdapter(NewHFChatModelAdapter):
+    """Adapter for the Gemma ``-it`` chat checkpoints (gemma-7b-it, gemma-2b-it).
+
+    https://huggingface.co/google/gemma-7b-it
+
+    TODO: There are problems with quantization.
+    """
+
+    # 4-bit/8-bit loading is disabled, presumably because of the quantization
+    # problems noted in the TODO above.
+    support_4bit: bool = False
+    support_8bit: bool = False
+    support_system_message: bool = False
+
+    def check_transformer_version(self, current_version: str) -> None:
+        """Ensure the given transformers version is at least 4.38.0.
+
+        The version is compared numerically, component by component. A plain
+        string comparison would rank "4.4.0" above "4.38.0" and "4.100.0"
+        below it, accepting too-old releases and rejecting newer ones.
+
+        Args:
+            current_version: Version string to check, e.g. the value of
+                ``transformers.__version__``.
+
+        Raises:
+            ValueError: If the version is older than 4.38.0 or does not start
+                with a numeric release segment.
+        """
+        import re
+
+        # Keep only the leading numeric release ("4.38.0.dev0" -> "4.38.0").
+        release = re.match(r"\d+(?:\.\d+)*", current_version.strip())
+        parts = tuple(int(p) for p in release.group().split(".")) if release else ()
+        # Pad short versions so that "4.38" compares equal to "4.38.0".
+        parts += (0,) * (3 - len(parts))
+        if parts < (4, 38, 0):
+            raise ValueError(
+                "Gemma require transformers.__version__>=4.38.0, please upgrade your transformers package."
+            )
+
+    def do_match(self, lower_model_name_or_path: Optional[str] = None):
+        """Return True when the name/path looks like a Gemma ``it`` model.
+
+        Args:
+            lower_model_name_or_path: Model name or path to test; presumably
+                already lower-cased by the caller (TODO confirm).
+
+        Returns:
+            bool: True if the value is non-empty and contains both "gemma-"
+            and "it"; False otherwise (including for ``None`` or "").
+        """
+        # NOTE(review): the bare "it" test also matches unrelated substrings
+        # elsewhere in a path (e.g. ".../smith/gemma-7b"); consider matching
+        # "-it" on the final path component once the naming is confirmed.
+        return bool(
+            lower_model_name_or_path
+            and "gemma-" in lower_model_name_or_path
+            and "it" in lower_model_name_or_path
+        )
+
+
 register_model_adapter(YiAdapter)
 register_model_adapter(Mixtral8x7BAdapter)
 register_model_adapter(SOLARAdapter)
+register_model_adapter(GemmaAdapter)