Add support for OpenTelemetry instrumentation 📊 (#200)

Aymeric Roucher 2025-01-15 12:10:52 +01:00 committed by GitHub
parent ce1cd6d906
commit 450934ce79
2 changed files with 59 additions and 5 deletions


@@ -14,7 +14,7 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from dataclasses import dataclass
from dataclasses import dataclass, asdict
import json
import logging
import os
@@ -54,12 +54,29 @@ if _is_package_available("litellm"):
import litellm
def get_dict_from_nested_dataclasses(obj):
def convert(obj):
if hasattr(obj, "__dataclass_fields__"):
return {k: convert(v) for k, v in asdict(obj).items()}
return obj
return convert(obj)
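A minimal standalone sketch (not part of the diff) of what this helper does: asdict() already recurses into nested dataclasses, and convert() passes non-dataclass values through unchanged. The Inner/Outer dataclasses below are invented purely for illustration.

from dataclasses import asdict, dataclass
from typing import Optional


def get_dict_from_nested_dataclasses(obj):
    # Same helper as above: turn a (possibly nested) dataclass into plain dicts.
    def convert(obj):
        if hasattr(obj, "__dataclass_fields__"):
            return {k: convert(v) for k, v in asdict(obj).items()}
        return obj

    return convert(obj)


@dataclass
class Inner:
    name: str
    value: Optional[int] = None


@dataclass
class Outer:
    label: str
    inner: Inner


print(get_dict_from_nested_dataclasses(Outer("demo", Inner("x", 1))))
# -> {'label': 'demo', 'inner': {'name': 'x', 'value': 1}}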
@dataclass
class ChatMessageToolCallDefinition:
arguments: Any
name: str
description: Optional[str] = None
@classmethod
def from_hf_api(cls, tool_call_definition) -> "ChatMessageToolCallDefinition":
return cls(
arguments=tool_call_definition.arguments,
name=tool_call_definition.name,
description=tool_call_definition.description,
)
@dataclass
class ChatMessageToolCall:
@@ -67,6 +84,14 @@ class ChatMessageToolCall:
id: str
type: str
@classmethod
def from_hf_api(cls, tool_call) -> "ChatMessageToolCall":
return cls(
function=ChatMessageToolCallDefinition.from_hf_api(tool_call.function),
id=tool_call.id,
type=tool_call.type,
)
@dataclass
class ChatMessage:
@@ -74,6 +99,19 @@
content: Optional[str] = None
tool_calls: Optional[List[ChatMessageToolCall]] = None
def model_dump_json(self):
return json.dumps(get_dict_from_nested_dataclasses(self))
@classmethod
def from_hf_api(cls, message) -> "ChatMessage":
tool_calls = None
if getattr(message, "tool_calls", None) is not None:
tool_calls = [
ChatMessageToolCall.from_hf_api(tool_call)
for tool_call in message.tool_calls
]
return cls(role=message.role, content=message.content, tool_calls=tool_calls)
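A rough usage sketch (not in the commit) of the conversion path these classmethods add. It assumes ChatMessage is importable from smolagents, as the __all__ change below makes explicit; the SimpleNamespace objects stand in for the message returned by the Hugging Face chat-completion API, and the tool-call values are invented.

from types import SimpleNamespace

from smolagents import ChatMessage

# Stand-in for response.choices[0].message as returned by the Inference API.
api_message = SimpleNamespace(
    role="assistant",
    content=None,
    tool_calls=[
        SimpleNamespace(
            id="call_0",
            type="function",
            function=SimpleNamespace(
                name="get_weather",
                arguments={"celsius": True},
                description=None,
            ),
        )
    ],
)

chat_message = ChatMessage.from_hf_api(api_message)
print(chat_message.model_dump_json())  # serializes the nested dataclasses to JSON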
class MessageRole(str, Enum):
USER = "user"
@@ -283,7 +321,7 @@ class HfApiModel(Model):
)
self.last_input_token_count = response.usage.prompt_tokens
self.last_output_token_count = response.usage.completion_tokens
return response.choices[0].message
return ChatMessage.from_hf_api(response.choices[0].message)
class TransformersModel(Model):
@@ -315,14 +353,18 @@ class TransformersModel(Model):
logger.info(f"Using device: {self.device}")
try:
self.tokenizer = AutoTokenizer.from_pretrained(model_id)
self.model = AutoModelForCausalLM.from_pretrained(model_id, device_map=self.device)
self.model = AutoModelForCausalLM.from_pretrained(
model_id, device_map=self.device
)
except Exception as e:
logger.warning(
f"Failed to load tokenizer and model for {model_id=}: {e}. Loading default tokenizer and model instead from {default_model_id=}."
)
self.model_id = default_model_id
self.tokenizer = AutoTokenizer.from_pretrained(default_model_id)
self.model = AutoModelForCausalLM.from_pretrained(model_id, device_map=self.device)
self.model = AutoModelForCausalLM.from_pretrained(
model_id, device_map=self.device
)
def make_stopping_criteria(self, stop_sequences: List[str]) -> StoppingCriteriaList:
class StopOnStrings(StoppingCriteria):
@@ -551,4 +593,5 @@ __all__ = [
"HfApiModel",
"LiteLLMModel",
"OpenAIServerModel",
"ChatMessage",
]


@@ -13,9 +13,10 @@
# See the License for the specific language governing permissions and
# limitations under the License.
import unittest
import json
from typing import Optional
from smolagents import models, tool
from smolagents import models, tool, ChatMessage, HfApiModel
class ModelTests(unittest.TestCase):
@@ -38,3 +39,13 @@ class ModelTests(unittest.TestCase):
"properties"
]["celsius"]
)
def test_chatmessage_has_model_dump_json(self):
message = ChatMessage("user", "Hello!")
data = json.loads(message.model_dump_json())
assert data["content"] == "Hello!"
def test_get_hfapi_message_no_tool(self):
model = HfApiModel()
messages = [{"role": "user", "content": "Hello!"}]
model(messages, stop_sequences=["great"])
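As a sketch only (not part of the commit): the live-API test above discards the model output. Assuming network access and a configured Hugging Face token, the same call could additionally assert the new return type introduced by this change, along these lines:

output = model(messages, stop_sequences=["great"])
# With the HfApiModel change above, the result is a smolagents ChatMessage
# rather than the raw API message object, and its content is plain text here.
assert isinstance(output, ChatMessage)
assert isinstance(output.content, str)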