AgentOps-AI · teocns · Dec 2, 2024 · Nov 21, 2024 · Nov 22, 2024 · Nov 22, 2024
diff --git a/agentops/client.py b/agentops/client.py
@@ -5,29 +5,29 @@
     Client: Provides methods to interact with the AgentOps service.
 """
 
-import inspect
 import atexit
+import inspect
 import logging
 import os
 import signal
 import sys
 import threading
 import traceback
 from decimal import Decimal
+from functools import cached_property
+from typing import List, Optional, Tuple, Union
 from uuid import UUID, uuid4
-from typing import Optional, List, Union, Tuple
+
 from termcolor import colored
 
-from .event import Event, ErrorEvent
-from .singleton import (
-    conditional_singleton,
-)
-from .session import Session, active_sessions
+from .config import Configuration
+from .event import ErrorEvent, Event
 from .host_env import get_host_env
+from .llms import LlmTracker
 from .log_config import logger
 from .meta_client import MetaClient
-from .config import Configuration
-from .llms import LlmTracker
+from .session import Session, active_sessions
+from .singleton import conditional_singleton
 
 
 @conditional_singleton
@@ -39,6 +39,7 @@ def __init__(self):
         self._sessions: List[Session] = active_sessions
         self._config = Configuration()
         self._pre_init_queue = {"agents": []}
+        self._host_env = None  # Cache host env data
 
         self.configure(
             api_key=os.environ.get("AGENTOPS_API_KEY"),
@@ -111,6 +112,7 @@ def initialize(self) -> Union[Session, None]:
     def _initialize_autogen_logger(self) -> None:
         try:
             import autogen
+
             from .partners.autogen_logger import AutogenLogger
 
             autogen.runtime_logging.start(logger=AutogenLogger())
@@ -224,7 +226,7 @@ def start_session(
         session = Session(
             session_id=session_id,
             tags=list(session_tags),
-            host_env=get_host_env(self._config.env_data_opt_out),
+            host_env=self.host_env,
             config=self._config,
         )
 
@@ -430,3 +432,8 @@ def api_key(self):
     @property
     def parent_key(self):
         return self._config.parent_key
+
+    @cached_property
+    def host_env(self):
+        """Host environment data for this client, computed once per instance.
+
+        The first access calls ``get_host_env`` with the configured
+        ``env_data_opt_out`` flag. ``cached_property`` then stores the result
+        on the instance, so later changes to that flag do not affect the
+        value returned here.
+        """
+        opt_out = self._config.env_data_opt_out
+        return get_host_env(opt_out)
diff --git a/agentops/event.py b/agentops/event.py
@@ -82,6 +82,7 @@ class LLMEvent(Event):
     prompt_tokens: Optional[int] = None
     completion: Union[str, object] = None
     completion_tokens: Optional[int] = None
+    cost: Optional[float] = None
     model: Optional[str] = None
 
 

diff --git a/agentops/http_client.py b/agentops/http_client.py
@@ -1,7 +1,9 @@
 from enum import Enum
-from typing import Optional
-from requests.adapters import Retry, HTTPAdapter
+from typing import Optional, Dict, Any
+
 import requests
+from requests.adapters import HTTPAdapter, Retry
+import json
 
 from .exceptions import ApiServerException
 
@@ -54,33 +56,79 @@
 
 
 class HttpClient:
-    @staticmethod
+    _session: Optional[requests.Session] = None
+
+    @classmethod
+    def get_session(cls) -> requests.Session:
+        """Return the shared ``requests.Session``, creating it on first use.
+
+        The session is stored on the class (``cls._session``) so that ``post``
+        and ``get`` reuse the same connection pools. It is configured on a
+        local variable and only then published, so a caller never receives a
+        session that is missing its adapters or default headers.
+
+        Returns:
+            The class-level session with pooling, retries and default headers.
+        """
+        if cls._session is None:
+            session = requests.Session()
+
+            # Configure connection pooling and retries.
+            # NOTE(review): urllib3's ``Retry`` applies ``status_forcelist``
+            # only to its allowed (idempotent) methods by default, so POST
+            # responses are presumably not retried on 5xx -- confirm intent.
+            adapter = HTTPAdapter(
+                pool_connections=15,  # Number of connection pools
+                pool_maxsize=256,  # Connections per pool
+                max_retries=Retry(total=3, backoff_factor=0.1, status_forcelist=[500, 502, 503, 504]),
+            )
+
+            # Mount adapter for both HTTP and HTTPS
+            session.mount("http://", adapter)
+            session.mount("https://", adapter)
+
+            # Set default headers
+            session.headers.update(
+                {
+                    "Connection": "keep-alive",
+                    "Keep-Alive": "timeout=10, max=1000",
+                    "Content-Type": "application/json",
+                }
+            )
+
+            # Publish only after configuration is complete.
+            cls._session = session
+
+        return cls._session
+
+    @classmethod
+    def _prepare_headers(
+        cls,
+        api_key: Optional[str] = None,
+        parent_key: Optional[str] = None,
+        jwt: Optional[str] = None,
+        custom_headers: Optional[dict] = None,
+    ) -> dict:
+        """Build the header dict for a single request.
+
+        Starts from a copy of ``JSON_HEADER`` (the module-level dict itself is
+        left untouched), adds whichever credentials were supplied, then lets
+        ``custom_headers`` override any of the resulting entries.
+
+        Args:
+            api_key: Sent as ``X-Agentops-Api-Key`` when not ``None``.
+            parent_key: Sent as ``X-Agentops-Parent-Key`` when not ``None``.
+            jwt: Sent as a ``Bearer`` token in ``Authorization`` when not ``None``.
+            custom_headers: Extra headers applied last, when not ``None``.
+
+        Returns:
+            A new dict of headers for this request.
+        """
+        prepared = JSON_HEADER.copy()
+
+        # Optional credentials, in the order they are added to the dict.
+        optional_headers = (
+            ("X-Agentops-Api-Key", api_key),
+            ("X-Agentops-Parent-Key", parent_key),
+            ("Authorization", None if jwt is None else f"Bearer {jwt}"),
+        )
+        prepared.update({name: value for name, value in optional_headers if value is not None})
+
+        # Caller-supplied headers win over everything set above.
+        if custom_headers is not None:
+            prepared.update(custom_headers)
+
+        return prepared
+
+    @classmethod
     def post(
+        cls,
         url: str,
         payload: bytes,
         api_key: Optional[str] = None,
         parent_key: Optional[str] = None,
         jwt: Optional[str] = None,
-        header=None,
+        header: Optional[Dict[str, str]] = None,
     ) -> Response:
+        """Make HTTP POST request using connection pooling"""
         result = Response()
         try:
-            # Create request session with retries configured
-            request_session = requests.Session()
-            request_session.mount(url, HTTPAdapter(max_retries=retry_config))
-
-            if api_key is not None:
-                JSON_HEADER["X-Agentops-Api-Key"] = api_key
-
-            if parent_key is not None:
-                JSON_HEADER["X-Agentops-Parent-Key"] = parent_key
-
-            if jwt is not None:
-                JSON_HEADER["Authorization"] = f"Bearer {jwt}"
-
-            res = request_session.post(url, data=payload, headers=JSON_HEADER, timeout=20)
-
+            headers = cls._prepare_headers(api_key, parent_key, jwt, header)
+            session = cls.get_session()
+            res = session.post(url, data=payload, headers=headers, timeout=20)
             result.parse(res)
+
         except requests.exceptions.Timeout:
             result.code = 408
             result.status = HttpStatus.TIMEOUT
@@ -112,28 +160,22 @@
 
         return result
 
-    @staticmethod
+    @classmethod
     def get(
+        cls,
         url: str,
         api_key: Optional[str] = None,
         jwt: Optional[str] = None,
-        header=None,
+        header: Optional[Dict[str, str]] = None,
     ) -> Response:
+        """Make HTTP GET request using connection pooling"""
         result = Response()
         try:
-            # Create request session with retries configured
-            request_session = requests.Session()
-            request_session.mount(url, HTTPAdapter(max_retries=retry_config))
-
-            if api_key is not None:
-                JSON_HEADER["X-Agentops-Api-Key"] = api_key
-
-            if jwt is not None:
-                JSON_HEADER["Authorization"] = f"Bearer {jwt}"
-
-            res = request_session.get(url, headers=JSON_HEADER, timeout=20)
-
+            headers = cls._prepare_headers(api_key, None, jwt, header)
+            session = cls.get_session()
+            res = session.get(url, headers=headers, timeout=20)
             result.parse(res)
+
         except requests.exceptions.Timeout:
             result.code = 408
             result.status = HttpStatus.TIMEOUT

diff --git a/agentops/llms/anthropic.py b/agentops/llms/anthropic.py
@@ -137,7 +137,7 @@ async def async_generator():
 
                 The raw response has the following structure:
                 {
-                    'id': str,              # Message ID (e.g. 'msg_018Gk9N2pcWaYLS7mxXbPD5i') 
+                    'id': str,              # Message ID (e.g. 'msg_018Gk9N2pcWaYLS7mxXbPD5i')
                     'type': str,            # Type of response (e.g. 'message')
                     'role': str,            # Role of responder (e.g. 'assistant')
                     'model': str,           # Model used (e.g. 'claude-3-5-sonnet-20241022')
@@ -151,7 +151,7 @@ async def async_generator():
                 }
 
                 Note: We import Anthropic types here since the package must be installed
-                for raw responses to be available; doing so in the global scope would 
+                for raw responses to be available; doing so in the global scope would
                 result in dependencies error since this provider is not lazily imported (tests fail)
                 """
                 from anthropic import APIResponse
@@ -167,7 +167,7 @@ async def async_generator():
                 llm_event.model = response_data["model"]
                 llm_event.completion = {
                     "role": response_data.get("role"),
-                    "content": response_data.get("content")[0].get("text") if response_data.get("content") else "",
+                    "content": (response_data.get("content")[0].get("text") if response_data.get("content") else ""),
                 }
                 if usage := response_data.get("usage"):
                     llm_event.prompt_tokens = usage.get("input_tokens")

diff --git a/agentops/partners/autogen_logger.py b/agentops/partners/autogen_logger.py
@@ -10,9 +10,9 @@
 from openai.types.chat import ChatCompletion
 
 from autogen.logger.base_logger import BaseLogger, LLMConfig
-from autogen.logger.logger_utils import get_current_ts, to_dict
 
 from agentops.enums import EndState
+from agentops.helpers import get_ISO_time
 
 from agentops import LLMEvent, ToolEvent, ActionEvent
 from uuid import uuid4
@@ -55,17 +55,19 @@ def log_chat_completion(
         start_time: str,
     ) -> None:
         """Records an LLMEvent to AgentOps session"""
-        end_time = get_current_ts()
 
         completion = response.choices[len(response.choices) - 1]
 
+        # Note: Autogen tokens are not included in the request and function call tokens are not counted in the completion
         llm_event = LLMEvent(
             prompt=request["messages"],
             completion=completion.message,
             model=response.model,
+            cost=cost,
+            returns=completion.message.to_json(),
         )
         llm_event.init_timestamp = start_time
-        llm_event.end_timestamp = end_time
+        llm_event.end_timestamp = get_ISO_time()
         llm_event.agent_id = self._get_agentops_id_from_agent(str(id(agent)))
         agentops.record(llm_event)