Source code for autogen_core.models._model_client

from __future__ import annotations

import warnings
from abc import ABC, abstractmethod
from typing import Literal, Mapping, Optional, Sequence, TypeAlias

from typing_extensions import Any, AsyncGenerator, Required, TypedDict, Union, deprecated

from .. import CancellationToken
from .._component_config import ComponentLoader
from ..tools import Tool, ToolSchema
from ._types import CreateResult, LLMMessage, RequestUsage


[docs] class ModelFamily: """A model family is a group of models that share similar characteristics from a capabilities perspective. This is different to discrete supported features such as vision, function calling, and JSON output. This namespace class holds constants for the model families that AutoGen understands. Other families definitely exist and can be represented by a string, however, AutoGen will treat them as unknown.""" GPT_4O = "gpt-4o" O1 = "o1" GPT_4 = "gpt-4" GPT_35 = "gpt-35" UNKNOWN = "unknown" ANY: TypeAlias = Literal["gpt-4o", "o1", "gpt-4", "gpt-35", "unknown"] def __new__(cls, *args: Any, **kwargs: Any) -> ModelFamily: raise TypeError(f"{cls.__name__} is a namespace class and cannot be instantiated.")
[docs] @deprecated("Use the ModelInfo class instead ModelCapabilities.") class ModelCapabilities(TypedDict, total=False): vision: Required[bool] function_calling: Required[bool] json_output: Required[bool]
[docs] class ModelInfo(TypedDict, total=False): vision: Required[bool] """True if the model supports vision, aka image input, otherwise False.""" function_calling: Required[bool] """True if the model supports function calling, otherwise False.""" json_output: Required[bool] """True if the model supports json output, otherwise False. Note: this is different to structured json.""" family: Required[ModelFamily.ANY | str] """Model family should be one of the constants from :py:class:`ModelFamily` or a string representing an unknown model family."""
[docs] class ChatCompletionClient(ABC, ComponentLoader): # Caching has to be handled internally as they can depend on the create args that were stored in the constructor
[docs] @abstractmethod async def create(
self, messages: Sequence[LLMMessage], *, tools: Sequence[Tool | ToolSchema] = [], # None means do not override the default # A value means to override the client default - often specified in the constructor json_output: Optional[bool] = None, extra_create_args: Mapping[str, Any] = {}, cancellation_token: Optional[CancellationToken] = None, ) -> CreateResult: ...
[docs] @abstractmethod def create_stream(
self, messages: Sequence[LLMMessage], *, tools: Sequence[Tool | ToolSchema] = [], # None means do not override the default # A value means to override the client default - often specified in the constructor json_output: Optional[bool] = None, extra_create_args: Mapping[str, Any] = {}, cancellation_token: Optional[CancellationToken] = None, ) -> AsyncGenerator[Union[str, CreateResult], None]: ...
[docs] @abstractmethod def actual_usage(self) -> RequestUsage: ...
[docs] @abstractmethod def total_usage(self) -> RequestUsage: ...
[docs] @abstractmethod def count_tokens(self, messages: Sequence[LLMMessage], *, tools: Sequence[Tool | ToolSchema] = []) -> int: ...
[docs] @abstractmethod def remaining_tokens(self, messages: Sequence[LLMMessage], *, tools: Sequence[Tool | ToolSchema] = []) -> int: ...
# Deprecated @property @abstractmethod def capabilities(self) -> ModelCapabilities: ... # type: ignore @property @abstractmethod def model_info(self) -> ModelInfo: warnings.warn( "Model client in use does not implement model_info property. Falling back to capabilities property. The capabilities property is deprecated and will be removed soon, please implement model_info instead in the model client class.", stacklevel=2, ) base_info: ModelInfo = self.capabilities # type: ignore base_info["family"] = ModelFamily.UNKNOWN return base_info