From a8776755a707bf1877f6cea5debce05546c621c1 Mon Sep 17 00:00:00 2001 From: Aymeric Date: Fri, 10 Jan 2025 14:46:15 +0100 Subject: [PATCH 1/4] Halve import time by removing torch dependency --- docs/source/en/examples/multiagents.md | 6 +++--- docs/source/en/tutorials/tools.md | 4 ++-- pyproject.toml | 17 +++++++++++---- src/smolagents/default_tools.py | 17 ++++++++++----- src/smolagents/models.py | 30 +++++++++----------------- src/smolagents/tools.py | 24 ++++++++++----------- src/smolagents/types.py | 2 +- tests/test_types.py | 6 +++++- 8 files changed, 57 insertions(+), 49 deletions(-) diff --git a/docs/source/en/examples/multiagents.md b/docs/source/en/examples/multiagents.md index 4ea4e51b..7901de2b 100644 --- a/docs/source/en/examples/multiagents.md +++ b/docs/source/en/examples/multiagents.md @@ -48,10 +48,10 @@ Run the line below to install the required dependencies: Let's login in order to call the HF Inference API: -```py -from huggingface_hub import notebook_login +``` +from huggingface_hub import login -notebook_login() +login() ``` ⚡️ Our agent will be powered by [Qwen/Qwen2.5-Coder-32B-Instruct](https://huggingface.co/Qwen/Qwen2.5-Coder-32B-Instruct) using `HfApiModel` class that uses HF's Inference API: the Inference API allows to quickly and easily run any OS model. diff --git a/docs/source/en/tutorials/tools.md b/docs/source/en/tutorials/tools.md index 014cd3b6..bcaaa0f4 100644 --- a/docs/source/en/tutorials/tools.md +++ b/docs/source/en/tutorials/tools.md @@ -177,7 +177,7 @@ agent.run("How many more blocks (also denoted as layers) are in BERT base encode ### Manage your agent's toolbox -You can manage an agent's toolbox by adding or replacing a tool. +You can manage an agent's toolbox by adding or replacing a tool in attribute `agent.tools`, since it is a standard dictionary. Let's add the `model_download_tool` to an existing agent initialized with only the default toolbox. 
@@ -187,7 +187,7 @@ from smolagents import HfApiModel model = HfApiModel("Qwen/Qwen2.5-Coder-32B-Instruct") agent = CodeAgent(tools=[], model=model, add_base_tools=True) -agent.tools.append(model_download_tool) +agent.tools[model_download_tool.name] = model_download_tool ``` Now we can leverage the new tool: diff --git a/pyproject.toml b/pyproject.toml index 978c1fb9..addfc0e4 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -12,9 +12,6 @@ authors = [ readme = "README.md" requires-python = ">=3.10" dependencies = [ - "torch", - "torchaudio", - "torchvision", "transformers>=4.0.0", "requests>=2.32.3", "rich>=13.9.4", @@ -30,10 +27,22 @@ dependencies = [ ] [tool.ruff] -ignore = ["F403"] +lint.ignore = ["F403"] [project.optional-dependencies] +dev = [ + "torch", + "torchaudio", + "torchvision", + "sqlalchemy", + "accelerate", + "soundfile", + "litellm>=1.55.10", +] test = [ + "torch", + "torchaudio", + "torchvision", "pytest>=8.1.0", "sqlalchemy", "ruff>=0.5.0", diff --git a/src/smolagents/default_tools.py b/src/smolagents/default_tools.py index 79539fda..75fe8d01 100644 --- a/src/smolagents/default_tools.py +++ b/src/smolagents/default_tools.py @@ -20,11 +20,9 @@ from typing import Dict, Optional from huggingface_hub import hf_hub_download, list_spaces -from transformers.models.whisper import ( - WhisperForConditionalGeneration, - WhisperProcessor, -) -from transformers.utils import is_offline_mode + + +from transformers.utils import is_offline_mode, is_torch_available from .local_python_executor import ( BASE_BUILTIN_MODULES, @@ -34,6 +32,15 @@ from .tools import TOOL_CONFIG_FILE, PipelineTool, Tool from .types import AgentAudio +if is_torch_available(): + from transformers.models.whisper import ( + WhisperForConditionalGeneration, + WhisperProcessor, + ) +else: + WhisperForConditionalGeneration = object + WhisperProcessor = object + @dataclass class PreTool: diff --git a/src/smolagents/models.py b/src/smolagents/models.py index 403e9fa3..136aede5 100644 --- a/src/smolagents/models.py +++ b/src/smolagents/models.py @@ -22,7 +22,6 @@ from enum import Enum from typing import Dict, List, Optional -import torch from huggingface_hub import ( InferenceClient, ChatCompletionOutputMessage, @@ -35,6 +34,7 @@ AutoTokenizer, StoppingCriteria, StoppingCriteriaList, + is_torch_available ) import openai @@ -58,7 +58,7 @@ is_litellm_available = True except ImportError: is_litellm_available = False - + class MessageRole(str, Enum): USER = "user" @@ -147,29 +147,12 @@ def __init__(self): self.last_input_token_count = None self.last_output_token_count = None - def get_token_counts(self): + def get_token_counts(self) -> Dict[str, int]: return { "input_token_count": self.last_input_token_count, "output_token_count": self.last_output_token_count, } - def generate( - self, - messages: List[Dict[str, str]], - stop_sequences: Optional[List[str]] = None, - grammar: Optional[str] = None, - max_tokens: int = 1500, - ): - raise NotImplementedError - - def get_tool_call( - self, - messages: List[Dict[str, str]], - available_tools: List[Tool], - stop_sequences, - ): - raise NotImplementedError - def __call__( self, messages: List[Dict[str, str]], @@ -256,6 +239,10 @@ def __call__( max_tokens: int = 1500, tools_to_call_from: Optional[List[Tool]] = None, ) -> str: + """ + Gets an LLM output message for the given list of input messages. + If argument `tools_to_call_from` is passed, the model's tool calling options will be used to return a tool call. 
+ """ messages = get_clean_message_list( messages, role_conversions=tool_role_conversions ) @@ -293,6 +280,9 @@ class TransformersModel(Model): def __init__(self, model_id: Optional[str] = None, device: Optional[str] = None): super().__init__() + if not is_torch_available(): + raise ImportError("Please install torch in order to use TransformersModel.") + import torch default_model_id = "HuggingFaceTB/SmolLM2-1.7B-Instruct" if model_id is None: model_id = default_model_id diff --git a/src/smolagents/tools.py b/src/smolagents/tools.py index 12d7d635..dafdde46 100644 --- a/src/smolagents/tools.py +++ b/src/smolagents/tools.py @@ -27,7 +27,6 @@ from pathlib import Path from typing import Callable, Dict, Optional, Union, get_type_hints -import torch from huggingface_hub import ( create_repo, get_collection, @@ -37,7 +36,6 @@ ) from huggingface_hub.utils import RepositoryNotFoundError from packaging import version -from transformers import AutoProcessor from transformers.dynamic_module_utils import get_imports from transformers.utils import ( TypeHintParsingException, @@ -52,15 +50,16 @@ from .types import ImageType, handle_agent_input_types, handle_agent_output_types from .utils import instance_to_source -logger = logging.getLogger(__name__) - - -if is_torch_available(): - pass +logger = logging.getLogger(__name__) if is_accelerate_available(): - pass + from accelerate import PartialState + from accelerate.utils import send_to_device +if is_torch_available(): + from transformers import AutoProcessor +else: + AutoProcessor = object TOOL_CONFIG_FILE = "tool_config.json" @@ -997,6 +996,8 @@ def __init__( if not is_torch_available(): raise ImportError("Please install torch in order to use this tool.") + import torch + if not is_accelerate_available(): raise ImportError("Please install accelerate in order to use this tool.") @@ -1026,8 +1027,6 @@ def setup(self): """ Instantiates the `pre_processor`, `model` and `post_processor` if necessary. """ - from accelerate import PartialState - if isinstance(self.pre_processor, str): self.pre_processor = self.pre_processor_class.from_pretrained( self.pre_processor, **self.hub_kwargs @@ -1066,6 +1065,7 @@ def forward(self, inputs): """ Sends the inputs through the `model`. 
""" + import torch with torch.no_grad(): return self.model(**inputs) @@ -1076,6 +1076,7 @@ def decode(self, outputs): return self.post_processor(outputs) def __call__(self, *args, **kwargs): + import torch args, kwargs = handle_agent_input_types(*args, **kwargs) if not self.is_initialized: @@ -1083,9 +1084,6 @@ def __call__(self, *args, **kwargs): encoded_inputs = self.encode(*args, **kwargs) - import torch - from accelerate.utils import send_to_device - tensor_inputs = { k: v for k, v in encoded_inputs.items() if isinstance(v, torch.Tensor) } diff --git a/src/smolagents/types.py b/src/smolagents/types.py index dbc5d5bd..681d98b1 100644 --- a/src/smolagents/types.py +++ b/src/smolagents/types.py @@ -253,7 +253,7 @@ def to_string(self): INSTANCE_TYPE_MAPPING = { str: AgentText, ImageType: AgentImage, - torch.Tensor: AgentAudio, + Tensor: AgentAudio, } if is_torch_available(): diff --git a/tests/test_types.py b/tests/test_types.py index e988e8b2..e9eb4138 100644 --- a/tests/test_types.py +++ b/tests/test_types.py @@ -18,7 +18,6 @@ import uuid from pathlib import Path -import torch from PIL import Image from transformers.testing_utils import ( require_soundfile, @@ -44,6 +43,8 @@ def get_new_path(suffix="") -> str: @require_torch class AgentAudioTests(unittest.TestCase): def test_from_tensor(self): + import torch + tensor = torch.rand(12, dtype=torch.float64) - 0.5 agent_type = AgentAudio(tensor) path = str(agent_type.to_string()) @@ -61,6 +62,8 @@ def test_from_tensor(self): self.assertTrue(torch.allclose(tensor, torch.tensor(new_tensor), atol=1e-4)) def test_from_string(self): + import torch + tensor = torch.rand(12, dtype=torch.float64) - 0.5 path = get_new_path(suffix=".wav") sf.write(path, tensor, 16000) @@ -75,6 +78,7 @@ def test_from_string(self): @require_torch class AgentImageTests(unittest.TestCase): def test_from_tensor(self): + import torch tensor = torch.randint(0, 256, (64, 64, 3)) agent_type = AgentImage(tensor) path = str(agent_type.to_string()) From 38816d5379519ad09025e25b48b6a2af43feccbe Mon Sep 17 00:00:00 2001 From: Aymeric Date: Fri, 10 Jan 2025 14:53:37 +0100 Subject: [PATCH 2/4] Fix is_soundfile_available version --- src/smolagents/types.py | 6 +++--- tests/test_types.py | 6 +++--- 2 files changed, 6 insertions(+), 6 deletions(-) diff --git a/src/smolagents/types.py b/src/smolagents/types.py index 681d98b1..a9730c1d 100644 --- a/src/smolagents/types.py +++ b/src/smolagents/types.py @@ -22,10 +22,10 @@ import numpy as np import requests from transformers.utils import ( - is_soundfile_availble, is_torch_available, is_vision_available, ) +from transformers.utils.import_utils import _is_package_available logger = logging.getLogger(__name__) @@ -41,7 +41,7 @@ else: Tensor = object -if is_soundfile_availble(): +if _is_package_available("soundfile"): import soundfile as sf @@ -189,7 +189,7 @@ class AgentAudio(AgentType, str): def __init__(self, value, samplerate=16_000): super().__init__(value) - if not is_soundfile_availble(): + if not _is_package_available("soundfile"): raise ImportError("soundfile must be installed in order to handle audio.") self._path = None diff --git a/tests/test_types.py b/tests/test_types.py index e9eb4138..e720f951 100644 --- a/tests/test_types.py +++ b/tests/test_types.py @@ -24,13 +24,13 @@ require_torch, require_vision, ) -from transformers.utils import ( - is_soundfile_availble, +from transformers.utils.import_utils import ( + _is_package_available, ) from smolagents.types import AgentAudio, AgentImage, AgentText -if is_soundfile_availble(): +if 
_is_package_available("soundfile"): import soundfile as sf From 11cbe9d6f57ccc906a29ffed75ce2ca3351d04d4 Mon Sep 17 00:00:00 2001 From: Aymeric Date: Fri, 10 Jan 2025 14:55:42 +0100 Subject: [PATCH 3/4] Fix is_soundfile_available version --- src/smolagents/models.py | 5 +++-- src/smolagents/tools.py | 6 +++--- tests/test_types.py | 3 ++- 3 files changed, 8 insertions(+), 6 deletions(-) diff --git a/src/smolagents/models.py b/src/smolagents/models.py index 136aede5..fd686075 100644 --- a/src/smolagents/models.py +++ b/src/smolagents/models.py @@ -34,7 +34,7 @@ AutoTokenizer, StoppingCriteria, StoppingCriteriaList, - is_torch_available + is_torch_available, ) import openai @@ -58,7 +58,7 @@ is_litellm_available = True except ImportError: is_litellm_available = False - + class MessageRole(str, Enum): USER = "user" @@ -283,6 +283,7 @@ def __init__(self, model_id: Optional[str] = None, device: Optional[str] = None) if not is_torch_available(): raise ImportError("Please install torch in order to use TransformersModel.") import torch + default_model_id = "HuggingFaceTB/SmolLM2-1.7B-Instruct" if model_id is None: model_id = default_model_id diff --git a/src/smolagents/tools.py b/src/smolagents/tools.py index dafdde46..2638f542 100644 --- a/src/smolagents/tools.py +++ b/src/smolagents/tools.py @@ -50,7 +50,7 @@ from .types import ImageType, handle_agent_input_types, handle_agent_output_types from .utils import instance_to_source -logger = logging.getLogger(__name__) +logger = logging.getLogger(__name__) if is_accelerate_available(): from accelerate import PartialState @@ -996,8 +996,6 @@ def __init__( if not is_torch_available(): raise ImportError("Please install torch in order to use this tool.") - import torch - if not is_accelerate_available(): raise ImportError("Please install accelerate in order to use this tool.") @@ -1066,6 +1064,7 @@ def forward(self, inputs): Sends the inputs through the `model`. """ import torch + with torch.no_grad(): return self.model(**inputs) @@ -1077,6 +1076,7 @@ def decode(self, outputs): def __call__(self, *args, **kwargs): import torch + args, kwargs = handle_agent_input_types(*args, **kwargs) if not self.is_initialized: diff --git a/tests/test_types.py b/tests/test_types.py index e720f951..aa58a8f0 100644 --- a/tests/test_types.py +++ b/tests/test_types.py @@ -44,7 +44,7 @@ def get_new_path(suffix="") -> str: class AgentAudioTests(unittest.TestCase): def test_from_tensor(self): import torch - + tensor = torch.rand(12, dtype=torch.float64) - 0.5 agent_type = AgentAudio(tensor) path = str(agent_type.to_string()) @@ -79,6 +79,7 @@ def test_from_string(self): class AgentImageTests(unittest.TestCase): def test_from_tensor(self): import torch + tensor = torch.randint(0, 256, (64, 64, 3)) agent_type = AgentImage(tensor) path = str(agent_type.to_string()) From 56ebbf1257fa8d5c6ed68e9fa71932bd2bd9e1a6 Mon Sep 17 00:00:00 2001 From: Aymeric Date: Fri, 10 Jan 2025 14:57:57 +0100 Subject: [PATCH 4/4] Update quality check python to 3.12 --- .github/workflows/quality.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/quality.yml b/.github/workflows/quality.yml index 37749d75..2e4f5c67 100644 --- a/.github/workflows/quality.yml +++ b/.github/workflows/quality.yml @@ -13,7 +13,7 @@ jobs: - name: Set up Python uses: actions/setup-python@v2 with: - python-version: "3.10" + python-version: "3.12" # Setup venv # TODO: revisit when https://github.com/astral-sh/uv/issues/1526 is addressed.
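-- 

A note on the pattern used throughout this series: every torch-dependent
module guards its module-level imports behind `is_torch_available()` and
defers `import torch` into the call sites that actually need it, so that
`import smolagents` no longer pays the torch startup cost. A minimal sketch
of that pattern (illustrative only -- `ExampleTool` is a made-up class, not
actual smolagents code):

    from transformers.utils import is_torch_available

    if is_torch_available():
        # Torch is present: torch-backed symbols can be imported eagerly.
        from transformers import AutoProcessor
    else:
        # Placeholder so module-level references still resolve without torch.
        AutoProcessor = object

    class ExampleTool:
        def forward(self, inputs):
            # Defer the heavy import until the tool is actually invoked,
            # mirroring PipelineTool.forward in this series.
            import torch

            with torch.no_grad():
                return inputs

The import-time claim in the subject line can be checked before and after
applying the series with CPython's built-in import tracer, e.g.
`python -X importtime -c "import smolagents"`.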