
Comparing changes

Choose two branches to see what’s changed or to start a new pull request. You can also learn more about diff comparisons.

base repository: InternLM/xtuner
base: v0.1.23
...
head repository: InternLM/xtuner
compare: main
  • 14 commits
  • 833 files changed
  • 11 contributors

Commits on Jul 29, 2024

  1. Added MiniCPM support to the README (#869)

    Co-authored-by: liudan <[email protected]>
    LDLINGLINGLING and liudan authored Jul 29, 2024
    d2a173a

Commits on Jul 31, 2024

  1. [Bug] fix dsv2 attn dispatch (softmax_scale) (#873)

    fix dsv2 attn dispatch (softmax_scale)
    HIT-cwh authored Jul 31, 2024

    01640b0

Commits on Aug 9, 2024

  1. [Bug] fix openai_map_fn bugs (#885)

    fix openai_map_fn bugs
    HIT-cwh authored Aug 9, 2024
    7dd779b
  2. support transformers >= 4.43 (#878)

    HIT-cwh authored Aug 9, 2024
    d81b366
  3. Add internlm2 5 cfgs (#872)

    * add internlm2.5 configs
    
    * limit transformers <= 4.42.4
    HIT-cwh authored Aug 9, 2024
    081c8ca

Commits on Sep 29, 2024

  1. [Bugs] fix qlora convert bugs (#930)

    fix qlora convert bugs
    HIT-cwh authored Sep 29, 2024
    4a1b201

Commits on Oct 22, 2024

  1. Added support for MiniCPM3 (#954)

    * add MiniCPM support to the README

    * adapt MiniCPM3 and verify that it runs

    * standardize the formatting and remove overlong lines
    
    * delete the error file
    
    * fix lint
    
    * fix the file name error
    
    ---------
    
    Co-authored-by: liudan <[email protected]>
    LDLINGLINGLING and liudan authored Oct 22, 2024
    697bc77

Commits on Nov 8, 2024

  1. Add functionality to download models from sources other than HuggingFace (#946)
    
    support openmind model and dataset
    starmountain1997 authored Nov 8, 2024
    90192ff

Commits on Jan 14, 2025

  1. Add Ascend NPU as a backend (#983)

    Co-authored-by: 郑特驹 <[email protected]>
    Tonyztj and 郑特驹 authored Jan 14, 2025
    2c06115
  2. [Feature]Support transformers==4.48 (#985)

    * update requirements
    
    * support internlm3, llama, mistral, mixtral, qwen2 and qwen2moe in transformers==4.48
    HIT-cwh authored Jan 14, 2025
    4ee8215

Commits on Jan 21, 2025

  1. [Feature] Auto patch for different devices (#986)

    * [Feature] XTuner Lite (#974)
    
    * minimum dependency sft
    
    * fix dispatch
    
    * add timer
    
    * add tgs
    
    * internlm2 tp
    
    * rms support tp
    
    * gradient checkpointing
    
    * lazy load pretrain
    
    * temp
    
    * fix bugs
    
    * add data pipeline example
    
    * fix lints
    
    * remove useless code
    
    * fix hard pack bug
    
    * add comments
    
    * clean code
    
    * add shard strategy
    
    * support cpu offload
    
    * support cpu offload
    
    * trust remote code
    
    * fix soft packer bug
    
    * fix soft packer bug
    
    * fix soft packer bug
    
    * refactor data pipeline
    
    * fixup
    
    * fix pad tokens bug
    
    * check input_ids and labels
    
    * check input_ids and labels in collator
    
    * fix load local datasets bug
    
    * fix load cached datasets
    
    * restore dset order
    
    * save cached infos
    
    * accelerate start up
    
    * avoid all gather cached datasets
    
    * fixup
    
    * fix cache bug
    
    * Support group length (#4)
    
    * replace rmsnorm kernel
    
    * support ftdp ds

    * support load_bin

    * support group by maxlen

    * add fsdp_ftdp_sft and fix fsdp_sft

    * support ftdp ds
    
    * add lr min
    
    * fix bugs
    
    * fix bugs
    
    * delete
    
    * support llava
    
    * support packer cache
    
    * refactor dist load
    
    * Add sp tp (#5)
    
    * support sp and tp
    
    * add fsdp_tp_sft and modify fsdp_sft
    
    * move chat_template
    
    * fix load_ds
    
    * delete useless codes
    
    * delete useless codes
    
    * fix jsonl load
    
    * refactor
    
    * fix bug
    
    * fix lr scheduler
    
    * refactor setup parallel
    
    * update data load
    
    * fix bugs
    
    * move fsdp
    
    * adapt new parallel load
    
    * fix setup_parallel (#7)
    
    * fix some bugs
    
    * add remote codes
    
    * add convert script
    
    * support load image from ceph
    
    * support load image from ceph
    
    * fix cache dataset bugs
    
    * support multi images
    
    * support llava interleave
    
    * fix load timeout
    
    * refactor datasets: optimize the cache mechanism and clean up code
    
    * distinguish dataset components based on algorithms
    
    * support fsdp2+3d parallel
    
    * fix lints
    
    * support contiguous batching
    
    * refactor parallel
    
    * zero wasting ppo
    
    * support ascend npu
    
    * fix openai convert
    
    * fix npu bugs
    
    * fix npu bug
    
    * dispatch npu flash attn
    
    * adapt ascend npu
    
    * fix ppo losses
    
    * steady increase in reward
    
    * faster ppo
    
    * fix top-p generate
    
    * support internlm3
    
    * baseline 2.5
    
    * fix internlm3
    
    * support hard pack (WIP)
    
    * support qwen2
    
    * fix dataset bugs
    
    * baseline
    
    * del ppo.py
    
    * fixup
    
    * support hybrid sp
    
    * fix hybrid sp
    
    * qwen2 + hybrid sp
    
    * fix requirements
    
    * avoid re-initialize dist
    
    * support group pack
    
    * pretrain (#13)
    
    * first commit: support internlm3 moe streaming dataset
    
    * move codes
    
    * Moe pretrain (#14)
    
    * first commit: support internlm3 moe streaming dataset
    
    * move codes
    
    * rmsnorm kernel support low version flash_attn
    
    * add barrier
    
    * support prompt length control (#15)
    
    * support VLM Base (#16)
    
    * add internvl
    
    * fix bug
    
    * remove dup code
    
    * support liger of internvl
    
    * fix bug
    
    * add get_repo_git_info
    
    * fix
    
    * add minicpmv
    
    * add minicpmv dispatch
    
    * accelerate tokenize
    
    * Update InternVL (#17)
    
    * fix dpo error
    
    * fix sp error
    
    * update dataset
    
    * fix
    
    * fix rand sampler (#18)
    
    * llama support transformers >= 4.45 (#19)
    
    * convert fsdp1 to fsdp2 in sft.py
    
    * [Feature] Support Liger Kernel (#20)
    
    * filter data by max length (#21)
    
    * fix causal forward, prefetch, and remote code (#22)
    
    * [Enhancement] Accelerating Data Pipeline (#23)
    
    * sample ratio greater than 1.0 and trunc max len
    
    * accelerating the counting of tokens
    
    * log reduced loss
    
    * fix micro bs greater than 1
    
    * [Enhancement] Ensure data integrity when the sampling ratio is more than 1 (#24)
    
    * repeat dataset
    
    * fixup
    
    * fix typos
    
    * fix typos
    
    * [Fix] Pass in temperature during generation (#25)
    
    * Support Janus and fix some error (#27)
    
    * add prefetch
    
    * update prefetch
    
    * add janus
    
    * add janus
    
    * fix
    
    * fix
    
    * fix llama position id error
    
    * fix ProcessPoolExecutor
    
    * update
    
    * fix llama
    
    * delete cache
    
    * remove useless code
    
    ---------
    
    Co-authored-by: whcao <[email protected]>
    Co-authored-by: Happy <[email protected]>
    Co-authored-by: Haian Huang(深度眸) <[email protected]>
    
    * support mlu (#984)
    
    * cleanup
    
    * add internlm3 remote code
    
    * cleanup
    
    * auto patch
    
    * remove useless code
    
    ---------
    
    Co-authored-by: whcao <[email protected]>
    Co-authored-by: Happy <[email protected]>
    Co-authored-by: Haian Huang(深度眸) <[email protected]>
    Co-authored-by: Lantian Zhang <[email protected]>
    5 people authored Jan 21, 2025
    4a521fb

Commits on Jan 22, 2025

  1. [Fix]MLU Device Mesh (#987)

    * fix mlu device mesh
    
    * update requirements
    pppppM authored Jan 22, 2025
    4cade9f

Commits on Feb 21, 2025

  1. bump version to v0.2.0rc0 (#990)

    * refactor dispatch
    
    * support qwen2
    
    * sp gather logprobs
    
    * optimize gpu memory
    
    * fix tp sample
    
    * fix auto cls
    
    * fix saved dtype
    
    * remove ascend llama
    
    * accelerate sp all to all
    
    * optimize long prefilling
    
    * fix tp>2 generate
    
    * [Enhance] Using `fork` mode for tokenization (#28)
    
    * integrate training and inference
    
    * [Enhance] Enhance the calculation of tokenize fn hash (#29)
    
    * [Fix] Cannot properly load buffer from the checkpoint (#30)
    
    * fix load buffer bug
    
    * add moe permute
    
    * fix lints
    
    * rm internvl2 dataset
    
    * rm tools
    
    * update precommit
    
    * bump version
    
    ---------
    
    Co-authored-by: Mashiro <[email protected]>
    Co-authored-by: whcao <[email protected]>
    3 people authored Feb 21, 2025
    bbcd94b
  2. Update README.md

    pppppM authored Feb 21, 2025
    53f2429
Showing 833 changed files with 51,070 additions and 27,077 deletions.
51 changes: 0 additions & 51 deletions .pre-commit-config-zh-cn.yaml

This file was deleted.

29 changes: 16 additions & 13 deletions .pre-commit-config.yaml
@@ -1,27 +1,19 @@
exclude: ^tests/data/|^xtuner/tools/model_converters/modeling_internlm2_reward/
exclude: ^tests/data/|^xtuner/model/transformers_models/|^xtuner/tools/model_converters/modeling_internlm2_reward/|^xtuner/_lite/modelings/|^xtuner/_lite/accelerate/dispatches/huggingface/
repos:
- repo: https://github.com/PyCQA/flake8
rev: 5.0.4
hooks:
- id: flake8
args: ["--exclude=xtuner/model/transformers_models/*"]
args: ["--max-line-length=119"]
- repo: https://github.com/PyCQA/isort
rev: 5.11.5
rev: 5.12.0
hooks:
- id: isort
- repo: https://github.com/pre-commit/mirrors-yapf
rev: v0.32.0
hooks:
- id: yapf
exclude: 'xtuner/parallel/sequence/__init__.py'
- repo: https://github.com/pre-commit/pre-commit-hooks
rev: v4.3.0
rev: v5.0.0
hooks:
- id: trailing-whitespace
- id: check-yaml
- id: end-of-file-fixer
- id: requirements-txt-fixer
- id: double-quote-string-fixer
- id: check-merge-conflict
- id: fix-encoding-pragma
args: ["--remove"]
@@ -45,9 +37,20 @@ repos:
rev: v1.3.1
hooks:
- id: docformatter
args: ["--in-place", "--wrap-descriptions", "79"]
args: ["--in-place", "--wrap-descriptions", "119"]
- repo: https://github.com/open-mmlab/pre-commit-hooks
rev: v0.4.0
hooks:
- id: check-copyright
args: ["xtuner", "--excludes", "xtuner/_lite/modelings/", "xtuner/model/transformers_models/"]
- id: remove-improper-eol-in-cn-docs
- repo: https://github.com/asottile/pyupgrade
rev: v3.0.0
hooks:
- id: pyupgrade
args: ["--py36-plus"]

- repo: https://github.com/psf/black
rev: 23.9.1
hooks:
- id: black
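The updated config raises flake8's limit to 119 characters and adds black. As an illustrative sketch only (not flake8 itself, which reports such lines as E501), the limit amounts to a check like this:

```python
# Illustrative sketch of the 119-character line limit the updated flake8
# config enforces; flake8's real check is the E501 rule, not this function.
def find_long_lines(text: str, limit: int = 119):
    """Return 1-based numbers of lines whose length exceeds `limit`."""
    return [i + 1 for i, line in enumerate(text.splitlines()) if len(line) > limit]

sample = "short line\n" + "x" * 130 + "\nanother short line\n"
print(find_long_lines(sample))  # only the 130-character line 2 exceeds the limit
```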
5 changes: 4 additions & 1 deletion README.md
@@ -38,7 +38,9 @@ English | [简体中文](README_zh-CN.md)
</div>

## 🎉 News

- **\[2025/02\]** Support [OREAL](https://github.com/InternLM/OREAL), a new RL method for math reasoning!
- **\[2025/01\]** Support [InternLM3 8B Instruct](https://huggingface.co/internlm/internlm3-8b-instruct)!
- **\[2024/07\]** Support [MiniCPM](xtuner/configs/minicpm/) models!
- **\[2024/07\]** Support [DPO](https://github.com/InternLM/xtuner/tree/main/xtuner/configs/dpo), [ORPO](https://github.com/InternLM/xtuner/tree/main/xtuner/configs/orpo) and [Reward Model](https://github.com/InternLM/xtuner/tree/main/xtuner/configs/reward_model) training with packed data and sequence parallel! See [documents](https://xtuner.readthedocs.io/en/latest/dpo/overview.html) for more details.
- **\[2024/07\]** Support [InternLM 2.5](xtuner/configs/internlm/internlm2_5_chat_7b/) models!
- **\[2024/06\]** Support [DeepSeek V2](xtuner/configs/deepseek/deepseek_v2_chat/) models! **2x faster!**
@@ -113,6 +115,7 @@ XTuner is an efficient, flexible and full-featured toolkit for fine-tuning large
<li><a href="https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1">Mixtral</a></li>
<li><a href="https://huggingface.co/deepseek-ai/DeepSeek-V2-Chat">DeepSeek V2</a></li>
<li><a href="https://huggingface.co/google">Gemma</a></li>
<li><a href="https://huggingface.co/openbmb">MiniCPM</a></li>
<li>...</li>
</ul>
</td>
2 changes: 2 additions & 0 deletions README_zh-CN.md
@@ -39,6 +39,7 @@

## 🎉 更新

- **\[2024/07\]** 支持 [MiniCPM](xtuner/configs/minicpm/) 模型!
- **\[2024/07\]** 支持训练 [DPO](https://github.com/InternLM/xtuner/tree/main/xtuner/configs/dpo)[ORPO](https://github.com/InternLM/xtuner/tree/main/xtuner/configs/orpo) 还有 [Reward Model](https://github.com/InternLM/xtuner/tree/main/xtuner/configs/reward_model) ! 并且能够支持打包数据以及序列并行功能! 请参考 [文档](https://xtuner.readthedocs.io/zh-cn/latest/dpo/overview.html) 了解更多信息。
- **\[2024/07\]** 支持 [InternLM 2.5](xtuner/configs/internlm/internlm2_5_chat_7b/) 模型!
- **\[2024/06\]** 支持 [DeepSeek V2](xtuner/configs/deepseek/deepseek_v2_chat/) models! **训练速度提升一倍!**
@@ -113,6 +114,7 @@ XTuner 是一个高效、灵活、全能的轻量化大模型微调工具库。
<li><a href="https://huggingface.co/mistralai/Mixtral-8x7B-Instruct-v0.1">Mixtral</a></li>
<li><a href="https://huggingface.co/deepseek-ai/DeepSeek-V2-Chat">DeepSeek V2</a></li>
<li><a href="https://huggingface.co/google">Gemma</a></li>
<li><a href="https://huggingface.co/openbmb">MiniCPM</a></li>
<li>...</li>
</ul>
</td>
70 changes: 35 additions & 35 deletions docs/en/conf.py
@@ -15,19 +15,19 @@

from sphinx.ext import autodoc

sys.path.insert(0, os.path.abspath('../..'))
sys.path.insert(0, os.path.abspath("../.."))

# -- Project information -----------------------------------------------------

project = 'XTuner'
copyright = '2024, XTuner Contributors'
author = 'XTuner Contributors'
project = "XTuner"
copyright = "2024, XTuner Contributors"
author = "XTuner Contributors"

# The full version, including alpha/beta/rc tags
version_file = '../../xtuner/version.py'
version_file = "../../xtuner/version.py"
with open(version_file) as f:
exec(compile(f.read(), version_file, 'exec'))
__version__ = locals()['__version__']
exec(compile(f.read(), version_file, "exec"))
__version__ = locals()["__version__"]
# The short X.Y version
version = __version__
# The full version, including alpha/beta/rc tags
@@ -39,41 +39,41 @@
# extensions coming with Sphinx (named 'sphinx.ext.*') or your custom
# ones.
extensions = [
'sphinx.ext.napoleon',
'sphinx.ext.viewcode',
'sphinx.ext.intersphinx',
'sphinx_copybutton',
'sphinx.ext.autodoc',
'sphinx.ext.autosummary',
'myst_parser',
'sphinxarg.ext',
"sphinx.ext.napoleon",
"sphinx.ext.viewcode",
"sphinx.ext.intersphinx",
"sphinx_copybutton",
"sphinx.ext.autodoc",
"sphinx.ext.autosummary",
"myst_parser",
"sphinxarg.ext",
]

# Add any paths that contain templates here, relative to this directory.
templates_path = ['_templates']
templates_path = ["_templates"]

# List of patterns, relative to source directory, that match files and
# directories to ignore when looking for source files.
# This pattern also affects html_static_path and html_extra_path.
exclude_patterns = ['_build', 'Thumbs.db', '.DS_Store']
exclude_patterns = ["_build", "Thumbs.db", ".DS_Store"]

# Exclude the prompt "$" when copying code
copybutton_prompt_text = r'\$ '
copybutton_prompt_text = r"\$ "
copybutton_prompt_is_regexp = True

language = 'en'
language = "en"

# -- Options for HTML output -------------------------------------------------

# The theme to use for HTML and HTML Help pages. See the documentation for
# a list of builtin themes.
#
html_theme = 'sphinx_book_theme'
html_logo = '_static/image/logo.png'
html_theme = "sphinx_book_theme"
html_logo = "_static/image/logo.png"
html_theme_options = {
'path_to_docs': 'docs/en',
'repository_url': 'https://github.com/InternLM/xtuner',
'use_repository_button': True,
"path_to_docs": "docs/en",
"repository_url": "https://github.com/InternLM/xtuner",
"use_repository_button": True,
}
# Add any paths that contain custom static files (such as style sheets) here,
# relative to this directory. They are copied after the builtin static files,
@@ -82,24 +82,24 @@

# Mock out external dependencies here.
autodoc_mock_imports = [
'cpuinfo',
'torch',
'transformers',
'psutil',
'prometheus_client',
'sentencepiece',
'vllm.cuda_utils',
'vllm._C',
'numpy',
'tqdm',
"cpuinfo",
"torch",
"transformers",
"psutil",
"prometheus_client",
"sentencepiece",
"vllm.cuda_utils",
"vllm._C",
"numpy",
"tqdm",
]


class MockedClassDocumenter(autodoc.ClassDocumenter):
"""Remove note about base class when a class is derived from object."""

def add_line(self, line: str, source: str, *lineno: int) -> None:
if line == ' Bases: :py:class:`object`':
if line == " Bases: :py:class:`object`":
return
super().add_line(line, source, *lineno)

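Both `conf.py` files load the package version by executing `version.py` and reading `__version__` from the resulting namespace. A minimal, self-contained sketch of that pattern (the version string literal here is a stand-in, not the real contents of `xtuner/version.py`):

```python
# Sketch of the version-loading pattern used in docs/*/conf.py: execute the
# version file's source and pull __version__ out of the resulting namespace.
version_source = '__version__ = "0.2.0rc0"\n'  # stand-in for xtuner/version.py
namespace = {}
exec(compile(version_source, "version.py", "exec"), namespace)
print(namespace["__version__"])
```

In the real `conf.py` the source comes from `open(version_file)` rather than a string literal.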
70 changes: 35 additions & 35 deletions docs/zh_cn/conf.py
@@ -15,19 +15,19 @@

from sphinx.ext import autodoc

sys.path.insert(0, os.path.abspath('../..'))
sys.path.insert(0, os.path.abspath("../.."))

# -- Project information -----------------------------------------------------

project = 'XTuner'
copyright = '2024, XTuner Contributors'
author = 'XTuner Contributors'
project = "XTuner"
copyright = "2024, XTuner Contributors"
author = "XTuner Contributors"

# The full version, including alpha/beta/rc tags
version_file = '../../xtuner/version.py'
version_file = "../../xtuner/version.py"
with open(version_file) as f:
exec(compile(f.read(), version_file, 'exec'))
__version__ = locals()['__version__']
exec(compile(f.read(), version_file, "exec"))
__version__ = locals()["__version__"]
# The short X.Y version
version = __version__
# The full version, including alpha/beta/rc tags
@@ -39,41 +39,41 @@
# extensions coming with Sphinx (named 'sphinx.ext.*') or your custom
# ones.
extensions = [
'sphinx.ext.napoleon',
'sphinx.ext.viewcode',
'sphinx.ext.intersphinx',
'sphinx_copybutton',
'sphinx.ext.autodoc',
'sphinx.ext.autosummary',
'myst_parser',
'sphinxarg.ext',
"sphinx.ext.napoleon",
"sphinx.ext.viewcode",
"sphinx.ext.intersphinx",
"sphinx_copybutton",
"sphinx.ext.autodoc",
"sphinx.ext.autosummary",
"myst_parser",
"sphinxarg.ext",
]

# Add any paths that contain templates here, relative to this directory.
templates_path = ['_templates']
templates_path = ["_templates"]

# List of patterns, relative to source directory, that match files and
# directories to ignore when looking for source files.
# This pattern also affects html_static_path and html_extra_path.
exclude_patterns = ['_build', 'Thumbs.db', '.DS_Store']
exclude_patterns = ["_build", "Thumbs.db", ".DS_Store"]

# Exclude the prompt "$" when copying code
copybutton_prompt_text = r'\$ '
copybutton_prompt_text = r"\$ "
copybutton_prompt_is_regexp = True

language = 'zh_CN'
language = "zh_CN"

# -- Options for HTML output -------------------------------------------------

# The theme to use for HTML and HTML Help pages. See the documentation for
# a list of builtin themes.
#
html_theme = 'sphinx_book_theme'
html_logo = '_static/image/logo.png'
html_theme = "sphinx_book_theme"
html_logo = "_static/image/logo.png"
html_theme_options = {
'path_to_docs': 'docs/zh_cn',
'repository_url': 'https://github.com/InternLM/xtuner',
'use_repository_button': True,
"path_to_docs": "docs/zh_cn",
"repository_url": "https://github.com/InternLM/xtuner",
"use_repository_button": True,
}
# Add any paths that contain custom static files (such as style sheets) here,
# relative to this directory. They are copied after the builtin static files,
@@ -82,24 +82,24 @@

# Mock out external dependencies here.
autodoc_mock_imports = [
'cpuinfo',
'torch',
'transformers',
'psutil',
'prometheus_client',
'sentencepiece',
'vllm.cuda_utils',
'vllm._C',
'numpy',
'tqdm',
"cpuinfo",
"torch",
"transformers",
"psutil",
"prometheus_client",
"sentencepiece",
"vllm.cuda_utils",
"vllm._C",
"numpy",
"tqdm",
]


class MockedClassDocumenter(autodoc.ClassDocumenter):
"""Remove note about base class when a class is derived from object."""

def add_line(self, line: str, source: str, *lineno: int) -> None:
if line == ' Bases: :py:class:`object`':
if line == " Bases: :py:class:`object`":
return
super().add_line(line, source, *lineno)

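The `MockedClassDocumenter` shown in both `conf.py` files suppresses autodoc's "Bases: object" note by dropping that one line. Outside of Sphinx, the filtering idea reduces to a sketch like this (the marker string follows the form shown above; autodoc's actual output may carry different leading whitespace):

```python
# Sketch of the line-filtering idea behind MockedClassDocumenter: drop the
# autodoc note saying a class derives from `object`, keep everything else.
BASES_OBJECT_NOTE = " Bases: :py:class:`object`"

def filter_autodoc_lines(lines):
    return [line for line in lines if line != BASES_OBJECT_NOTE]

doc_lines = ["MyClass documentation", BASES_OBJECT_NOTE, "Attributes: ..."]
print(filter_autodoc_lines(doc_lines))  # the Bases note is removed
```

The real implementation hooks the same check into `ClassDocumenter.add_line` so the filtering happens as autodoc emits each line.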