From 132f9f3e6a676236345281c493bdb5b33b0d9c33 Mon Sep 17 00:00:00 2001 From: Aymeric Date: Fri, 27 Dec 2024 17:19:07 +0100 Subject: [PATCH] Add torchvision dependency and change default HfApiModel model_id --- README.md | 2 +- pyproject.toml | 1 + src/smolagents/models.py | 2 +- 3 files changed, 3 insertions(+), 2 deletions(-) diff --git a/README.md b/README.md index 214843b..8e61d49 100644 --- a/README.md +++ b/README.md @@ -66,7 +66,7 @@ Especially, since code execution can be a security concern (arbitrary code execu ## How smol is it really? We strived to keep abstractions to a strict minimum: the main code in `agents.py` is only ~1,000 lines of code. -Still, we implement several types of agents: `CodeAgent` writes its actions as Python code snippets, and the more classic `ToolCallingAgent` that leverages built-in tool calling methods. +Still, we implement several types of agents: `CodeAgent` writes its actions as Python code snippets, and the more classic `ToolCallingAgent` leverages built-in tool calling methods. By the way, why use a framework at all? Well, because a big part of this stuff is non-trivial. For instance, the code agent has to keep a consistent format for code throughout its system prompt, its parser, the execution. So our framework handles this complexity for you. But of course we still encourage you to hack into the source code and use only the bits that you need, to the exclusion of everything else! 
diff --git a/pyproject.toml b/pyproject.toml index 210df30..f0dc9dd 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -26,6 +26,7 @@ dependencies = [ "e2b-code-interpreter>=1.0.3", "torch>=2.5.1", "litellm>=1.55.10", + "torchvision>=0.20.1", ] [project.optional-dependencies] diff --git a/src/smolagents/models.py b/src/smolagents/models.py index f3763d1..13e0f52 100644 --- a/src/smolagents/models.py +++ b/src/smolagents/models.py @@ -219,7 +219,7 @@ class HfApiModel(Model): def __init__( self, - model_id: str = "meta-llama/Llama-3.3-70B-Instruct", + model_id: str = "Qwen/Qwen2.5-Coder-32B-Instruct", token: Optional[str] = None, timeout: Optional[int] = 120, ):