Skip to content

afnio.models.model

afnio.models.model.BaseModel

Bases: ABC

An abstraction for a model.

Source code in afnio/models/model.py
 20
 21
 22
 23
 24
 25
 26
 27
 28
 29
 30
 31
 32
 33
 34
 35
 36
 37
 38
 39
 40
 41
 42
 43
 44
 45
 46
 47
 48
 49
 50
 51
 52
 53
 54
 55
 56
 57
 58
 59
 60
 61
 62
 63
 64
 65
 66
 67
 68
 69
 70
 71
 72
 73
 74
 75
 76
 77
 78
 79
 80
 81
 82
 83
 84
 85
 86
 87
 88
 89
 90
 91
 92
 93
 94
 95
 96
 97
 98
 99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
class BaseModel(ABC):
    """
    An abstraction for a model.
    """

    def __init__(
        self,
        provider: Optional[str] = None,
        config: Optional[dict] = None,
        usage: Optional[dict] = None,
    ):
        """Initializes the `BaseModel` instance.

        Args:
            provider: The name of the model provider (e.g., `"openai"`, `"anthropic"`).
            config: A dictionary containing provider-specific configuration parameters,
                such as model name, temperature, max tokens, etc. This is an internal
                implementation detail used by `afnio` to create a `BaseModel` instance
                on the backend, and is not intended to be set directly by users.
                Subclasses can define their own expected configuration parameters and
                should ensure that they are included in this dictionary when
                initializing the base class.
            usage: A dictionary to track token usage and cost information. It is
                typically initialized by subclasses with provider-specific usage metrics
                and cost structure.

        Raises:
            RuntimeError: If the server reports an error while creating the model,
                or does not return a `model_id`.
        """
        self.provider = provider
        self._config = config or {}
        # Shallow-copy `usage` so the cost reset below never mutates the
        # caller's dictionary in place.
        self._usage = dict(usage) if usage else {}
        self._usage.update(copy.deepcopy(INITIAL_COST))
        self.model_id: Optional[str] = None

        # Request user consent before sending sensitive info to the server
        check_consent()

        try:
            # Get the singleton websocket client
            _, ws_client = get_default_clients()

            payload = {
                "class_type": self.__class__.__name__,
                "provider": self.provider,
                "config": self.get_config(),
                "usage": self.get_usage(),
            }
            response = run_in_background_loop(ws_client.call("create_model", payload))
            if "error" in response:
                # Prefer the server-side exception detail when available.
                raise RuntimeError(
                    response["error"]["data"].get("exception", response["error"])
                )

            logger.debug(f"LM model created and shared with the server: {self!r}")

            model_id = response["result"].get("model_id")
            if not model_id:
                raise RuntimeError(
                    f"Server did not return a model_id "
                    f"for payload: {payload!r}, response: {response!r}"
                )
            self.model_id = model_id
            register_model(self)
        except Exception as e:
            logger.error(f"Failed to share LM model with the server: {e}")
            raise

    def get_provider(self) -> Optional[str]:
        """Returns the model provider name.

        Returns:
            provider: The name of the model provider (e.g., `"openai"`, `"anthropic"`),
                or None if not set.
        """
        return self.provider

    def get_config(self) -> Dict[str, Union[str, float, int]]:
        """Returns the model configuration.

        This includes the model name, temperature, max tokens, and other
        parameters that are used to configure the model's behavior.

        Note:
            The internal dictionary itself is returned (not a copy), so
            mutations by the caller are visible to this instance.

        Returns:
            A dictionary containing the model's configuration parameters.
        """
        return self._config

    def update_usage(
        self, usage: Dict[str, int], model_name: Optional[str] = None
    ) -> None:
        """Updates the internal token usage statistics and cost.

        Each model provider (e.g., OpenAI, Anthropic) may have a different usage format.
        This method should be implemented by subclasses to ensure correct parsing
        and aggregation of token usage.

        Behavior:
            - If `model_name` is provided, the method dynamically calculates and updates
              the cost based on the usage metrics and the pricing for the specified
              model.
            - If `model_name` is None, the method copies the cost value directly from
              the `usage` dictionary (if present), which is typically used when
              restoring state from a checkpoint.

        Args:
            usage (Dict[str, int]): A dictionary containing token usage metrics,
                such as `prompt_tokens`, `completion_tokens`, and `total_tokens`.
            model_name (str, optional): The name of the model for which the usage
                is being updated. If None, cost is copied from usage if available.

        Raises:
            NotImplementedError: If called on the base class without an implementation.
        """
        raise NotImplementedError

    def get_usage(self) -> Dict[str, int]:
        """Retrieves the current token usage statistics and cost (in USD).

        Returns:
            A dictionary containing cumulative token usage statistics since the model \
            instance was initialized. Note the copy is shallow: nested values such \
            as the cost dict are still shared with the internal state.

        Examples:
            >>> model.get_usage()
            {
                'prompt_tokens': 1500,
                'completion_tokens': 1200,
                'total_tokens': 2700,
                'cost': {'amount': 12.00, 'currency': 'USD'}
            }
        """
        return self._usage.copy()

    def clear_usage(self) -> None:
        """Clears the token usage statistics.

        This resets all numerical values in the usage dictionary to zero (including
        nested values), while preserving the dictionary structure.

        Note:
            Only a `clear_model_usage` request is issued here; `self._usage` is not
            modified locally — presumably the server propagates the reset state back
            to this client (TODO confirm).

        Raises:
            RuntimeError: If the server reports an error or does not return
                a `model_id`.
        """

        try:
            # Get the singleton websocket client
            _, ws_client = get_default_clients()

            payload = {
                "model_id": self.model_id,
            }
            response = run_in_background_loop(
                ws_client.call("clear_model_usage", payload)
            )
            if "error" in response:
                raise RuntimeError(
                    response["error"]["data"].get("exception", response["error"])
                )

            # The returned model_id only confirms the server acted on this model.
            model_id = response["result"].get("model_id")
            if not model_id:
                raise RuntimeError(
                    f"Server did not return a model_id "
                    f"for payload: {payload!r}, response: {response!r}"
                )

            logger.debug(f"LM model usage cleared on the server: {self!r}")
        except Exception as e:
            logger.error(f"Failed to clear LM model usage on the server: {e}")
            raise

    def __deepcopy__(self, memo):
        # NOTE(review): deliberately returns a plain metadata dict rather than a
        # new BaseModel instance — presumably consumed by reconstruction logic
        # elsewhere; confirm before relying on copy.deepcopy() semantics here.
        if id(self) in memo:
            return memo[id(self)]
        # Save only the class type and any necessary metadata (e.g., usage details)
        cls_copy = {
            "class_type": self.__class__.__name__,
            "provider": self.provider,
            "usage": self.get_usage(),
        }

        # Store the copied object in memo before returning it
        memo[id(self)] = cls_copy
        return cls_copy

__init__(provider=None, config=None, usage=None)

Initializes the BaseModel instance.

Parameters:

Name Type Description Default
provider str

The name of the model provider (e.g., "openai", "anthropic").

None
config dict | None

A dictionary containing provider-specific configuration parameters, such as model name, temperature, max tokens, etc. This is an internal implementation detail used by afnio to create a BaseModel instance on the backend, and is not intended to be set directly by users. Subclasses can define their own expected configuration parameters and should ensure that they are included in this dictionary when initializing the base class.

None
usage dict | None

A dictionary to track token usage and cost information. It is typically initialized by subclasses with provider-specific usage metrics and cost structure.

None
Source code in afnio/models/model.py
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
def __init__(
    self,
    provider: Optional[str] = None,
    config: Optional[dict] = None,
    usage: Optional[dict] = None,
):
    """Initializes the `BaseModel` instance.

    Args:
        provider: The name of the model provider (e.g., `"openai"`, `"anthropic"`).
        config: A dictionary containing provider-specific configuration parameters,
            such as model name, temperature, max tokens, etc. This is an internal
            implementation detail used by `afnio` to create a `BaseModel` instance
            on the backend, and is not intended to be set directly by users.
            Subclasses can define their own expected configuration parameters and
            should ensure that they are included in this dictionary when
            initializing the base class.
        usage: A dictionary to track token usage and cost information. It is
            typically initialized by subclasses with provider-specific usage metrics
            and cost structure.

    Raises:
        RuntimeError: If the server reports an error while creating the model,
            or does not return a `model_id`.
    """
    self.provider = provider
    self._config = config or {}
    # Shallow-copy `usage` so the cost reset below never mutates the
    # caller's dictionary in place.
    self._usage = dict(usage) if usage else {}
    self._usage.update(copy.deepcopy(INITIAL_COST))
    self.model_id: Optional[str] = None

    # Request user consent before sending sensitive info to the server
    check_consent()

    try:
        # Get the singleton websocket client
        _, ws_client = get_default_clients()

        payload = {
            "class_type": self.__class__.__name__,
            "provider": self.provider,
            "config": self.get_config(),
            "usage": self.get_usage(),
        }
        response = run_in_background_loop(ws_client.call("create_model", payload))
        if "error" in response:
            # Prefer the server-side exception detail when available.
            raise RuntimeError(
                response["error"]["data"].get("exception", response["error"])
            )

        logger.debug(f"LM model created and shared with the server: {self!r}")

        model_id = response["result"].get("model_id")
        if not model_id:
            raise RuntimeError(
                f"Server did not return a model_id "
                f"for payload: {payload!r}, response: {response!r}"
            )
        self.model_id = model_id
        register_model(self)
    except Exception as e:
        logger.error(f"Failed to share LM model with the server: {e}")
        raise

get_provider()

Returns the model provider name.

Returns:

Name Type Description
provider str | None

The name of the model provider (e.g., "openai", "anthropic"), or None if not set.

Source code in afnio/models/model.py
85
86
87
88
89
90
91
92
def get_provider(self) -> Optional[str]:
    """Return the name of the configured model provider.

    Returns:
        The provider name (e.g., `"openai"`, `"anthropic"`), or `None`
        if no provider was configured.
    """
    provider_name = self.provider
    return provider_name

get_config()

Returns the model configuration.

This includes the model name, temperature, max tokens, and other parameters that are used to configure the model's behavior.

Returns:

Type Description
dict[str, str | float | int]

A dictionary containing the model's configuration parameters.

Source code in afnio/models/model.py
 94
 95
 96
 97
 98
 99
100
101
102
103
def get_config(self) -> Dict[str, Union[str, float, int]]:
    """Return the model's configuration dictionary.

    The configuration holds parameters such as the model name, temperature,
    and max tokens that shape the model's behavior.

    Note:
        The internal dictionary itself is returned (not a copy), so
        mutations by the caller are visible to this instance.

    Returns:
        The dictionary of configuration parameters.
    """
    current_config = self._config
    return current_config

update_usage(usage, model_name=None)

Updates the internal token usage statistics and cost.

Each model provider (e.g., OpenAI, Anthropic) may have a different usage format. This method should be implemented by subclasses to ensure correct parsing and aggregation of token usage.

Behavior
  • If model_name is provided, the method dynamically calculates and updates the cost based on the usage metrics and the pricing for the specified model.
  • If model_name is None, the method copies the cost value directly from the usage dictionary (if present), which is typically used when restoring state from a checkpoint.

Parameters:

Name Type Description Default
usage dict[str, int]

A dictionary containing token usage metrics, such as prompt_tokens, completion_tokens, and total_tokens.

required
model_name str

The name of the model for which the usage is being updated. If None, cost is copied from usage if available.

None

Raises:

Type Description
NotImplementedError

If called on the base class without an implementation.

Source code in afnio/models/model.py
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
def update_usage(
    self, usage: Dict[str, int], model_name: Optional[str] = None
) -> None:
    """Updates the internal token usage statistics and cost.

    Each model provider (e.g., OpenAI, Anthropic) may have a different usage format.
    This method should be implemented by subclasses to ensure correct parsing
    and aggregation of token usage.

    Behavior:
        - If `model_name` is provided, the method dynamically calculates and updates
          the cost based on the usage metrics and the pricing for the specified
          model.
        - If `model_name` is None, the method copies the cost value directly from
          the `usage` dictionary (if present), which is typically used when
          restoring state from a checkpoint.

    Args:
        usage (Dict[str, int]): A dictionary containing token usage metrics,
            such as `prompt_tokens`, `completion_tokens`, and `total_tokens`.
        model_name (str, optional): The name of the model for which the usage
            is being updated. If None, cost is copied from usage if available.

    Raises:
        NotImplementedError: If called on the base class without an implementation.
    """
    raise NotImplementedError

get_usage()

Retrieves the current token usage statistics and cost (in USD).

Returns:

Type Description
dict[str, int]

A dictionary containing cumulative token usage statistics since the model instance was initialized.

Examples:

>>> model.get_usage()
{
    'prompt_tokens': 1500,
    'completion_tokens': 1200,
    'total_tokens': 2700,
    'cost': {'amount': 12.00, 'currency': 'USD'}
}
Source code in afnio/models/model.py
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
def get_usage(self) -> Dict[str, int]:
    """Retrieves the current token usage statistics and cost (in USD).

    Returns:
        A shallow copy of the cumulative usage statistics gathered since \
        this model instance was created.

    Examples:
        >>> model.get_usage()
        {
            'prompt_tokens': 1500,
            'completion_tokens': 1200,
            'total_tokens': 2700,
            'cost': {'amount': 12.00, 'currency': 'USD'}
        }
    """
    # dict() produces the same shallow copy as dict.copy().
    return dict(self._usage)

clear_usage()

Clears the token usage statistics.

This resets all numerical values in the usage dictionary to zero (including nested values), while preserving the dictionary structure.

Source code in afnio/models/model.py
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
def clear_usage(self) -> None:
    """Clears the token usage statistics.

    This resets all numerical values in the usage dictionary to zero (including
    nested values), while preserving the dictionary structure.

    Note:
        Only a ``clear_model_usage`` request is issued here; ``self._usage`` is
        not modified locally — presumably the server propagates the reset state
        back to this client (TODO confirm).

    Raises:
        RuntimeError: If the server reports an error or does not return
            a ``model_id``.
    """

    try:
        # Get the singleton websocket client
        _, ws_client = get_default_clients()

        payload = {
            "model_id": self.model_id,
        }
        response = run_in_background_loop(
            ws_client.call("clear_model_usage", payload)
        )
        if "error" in response:
            # Prefer the server-side exception detail when available.
            raise RuntimeError(
                response["error"]["data"].get("exception", response["error"])
            )

        # The returned model_id only confirms the server acted on this model.
        model_id = response["result"].get("model_id")
        if not model_id:
            raise RuntimeError(
                f"Server did not return a model_id "
                f"for payload: {payload!r}, response: {response!r}"
            )

        logger.debug(f"LM model usage cleared on the server: {self!r}")
    except Exception as e:
        logger.error(f"Failed to clear LM model usage on the server: {e}")
        raise

afnio.models.model.TextCompletionModel

Bases: BaseModel

An abstraction for a language model that accepts a prompt composed of a single text input and generates a textual completion.

Source code in afnio/models/model.py
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
class TextCompletionModel(BaseModel):
    """
    An abstraction for a language model that accepts a prompt composed of a single
    text input and generates a textual completion.
    """

    def __init__(self, provider: Optional[str] = None, **kwargs):
        """Initializes the `TextCompletionModel` instance.

        Args:
            provider: The name of the model provider (e.g., `"openai"`, `"anthropic"`).
            **kwargs: Recognized/expected keys are `usage` (a dictionary to track token
                usage and cost information) and any provider-specific configuration
                parameters.
        """
        super().__init__(provider=provider, **kwargs)

    async def acomplete(self, prompt: str, **kwargs) -> str:
        """
        Asynchronous method to generate a completion for the given prompt.

        Args:
            prompt: The input text for which the model should generate a completion.
            **kwargs: Additional parameters to configure the model's behavior during
                chat completion. This may include options such as:

                - model (`str`): The model to use (e.g., `"gpt-4o"`).
                - temperature (`float`): Amount of randomness injected into
                    the response.
                - max_completion_tokens (`int`): Maximum number of tokens to generate.
                - etc.

                For a complete list of supported parameters for each model, refer to the
                respective API documentation.

        Returns:
            A string containing the generated completion.

        Raises:
            NotImplementedError: If called on the base class without an implementation.
        """
        raise NotImplementedError

    def complete(self, prompt: str, **kwargs) -> str:
        """
        Synchronous method to generate a completion for the given prompt.

        Args:
            prompt: The input text for which the model should generate a completion.
            **kwargs: Additional parameters to configure the model's behavior during
                chat completion. This may include options such as:

                - model (`str`): The model to use (e.g., `"gpt-4o"`).
                - temperature (`float`): Amount of randomness injected into
                    the response.
                - max_completion_tokens (`int`): Maximum number of tokens to generate.
                - etc.

                For a complete list of supported parameters for each model, refer to the
                respective API documentation.

        Returns:
            A string containing the generated completion.

        Raises:
            NotImplementedError: If called on the base class without an implementation.
        """
        raise NotImplementedError

__init__(provider=None, **kwargs)

Initializes the TextCompletionModel instance.

Parameters:

Name Type Description Default
provider str

The name of the model provider (e.g., "openai", "anthropic").

None
**kwargs

Recognized/expected keys are usage (a dictionary to track token usage and cost information) and any provider-specific configuration parameters.

{}
Source code in afnio/models/model.py
205
206
207
208
209
210
211
212
213
214
def __init__(self, provider: Optional[str] = None, **kwargs):
    """Initializes the `TextCompletionModel` instance.

    Args:
        provider: The name of the model provider (e.g., `"openai"`, `"anthropic"`).
        **kwargs: Recognized/expected keys are `usage` (a dictionary to track token
            usage and cost information) and any provider-specific configuration
            parameters.
    """
    super().__init__(provider=provider, **kwargs)

acomplete(prompt, **kwargs) async

Asynchronous method to generate a completion for the given prompt.

Parameters:

Name Type Description Default
prompt str

The input text for which the model should generate a completion.

required
**kwargs

Additional parameters to configure the model's behavior during chat completion. This may include options such as:

  • model (str): The model to use (e.g., "gpt-4o").
  • temperature (float): Amount of randomness injected into the response.
  • max_completion_tokens (int): Maximum number of tokens to generate.
  • etc.

For a complete list of supported parameters for each model, refer to the respective API documentation.

{}

Returns:

Type Description
str

A string containing the generated completion.

Source code in afnio/models/model.py
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
async def acomplete(self, prompt: str, **kwargs) -> str:
    """Generate a completion for *prompt* asynchronously.

    Subclasses must override this coroutine with a provider-specific
    implementation.

    Args:
        prompt: The input text to complete.
        **kwargs: Provider-specific options controlling generation,
            for example:

            - model (`str`): The model to use (e.g., `"gpt-4o"`).
            - temperature (`float`): Amount of randomness injected into
                the response.
            - max_completion_tokens (`int`): Maximum number of tokens to generate.

            See the provider's API documentation for the full list of
            supported parameters.

    Returns:
        The generated completion text.

    Raises:
        NotImplementedError: Always, on this abstract base implementation.
    """
    raise NotImplementedError

complete(prompt, **kwargs)

Synchronous method to generate a completion for the given prompt.

Parameters:

Name Type Description Default
prompt str

The input text for which the model should generate a completion.

required
**kwargs

Additional parameters to configure the model's behavior during chat completion. This may include options such as:

  • model (str): The model to use (e.g., "gpt-4o").
  • temperature (float): Amount of randomness injected into the response.
  • max_completion_tokens (int): Maximum number of tokens to generate.
  • etc.

For a complete list of supported parameters for each model, refer to the respective API documentation.

{}

Returns:

Type Description
str

A string containing the generated completion.

Source code in afnio/models/model.py
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
def complete(self, prompt: str, **kwargs) -> str:
    """Generate a completion for *prompt* synchronously.

    Subclasses must override this method with a provider-specific
    implementation.

    Args:
        prompt: The input text to complete.
        **kwargs: Provider-specific options controlling generation,
            for example:

            - model (`str`): The model to use (e.g., `"gpt-4o"`).
            - temperature (`float`): Amount of randomness injected into
                the response.
            - max_completion_tokens (`int`): Maximum number of tokens to generate.

            See the provider's API documentation for the full list of
            supported parameters.

    Returns:
        The generated completion text.

    Raises:
        NotImplementedError: Always, on this abstract base implementation.
    """
    raise NotImplementedError

afnio.models.model.ChatCompletionModel

Bases: BaseModel

An abstraction for a language model that accepts a prompt composed of an array of messages containing instructions for the model. Each message can have a different role, influencing how the model interprets the input.

Source code in afnio/models/model.py
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
class ChatCompletionModel(BaseModel):
    """
    An abstraction for a language model that accepts a prompt composed of an array
    of messages containing instructions for the model. Each message can have a
    different role, influencing how the model interprets the input.
    """

    def __init__(self, provider: Optional[str] = None, **kwargs):
        """Initializes the `ChatCompletionModel` instance.

        Args:
            provider: The name of the model provider (e.g., `"openai"`, `"anthropic"`).
            **kwargs: Recognized/expected keys are `usage` (a dictionary to track token
                usage and cost information) and any provider-specific configuration
                parameters.
        """
        super().__init__(provider=provider, **kwargs)

    # TODO: Add link to `API documentation` for kwargs of each supported model
    async def achat(self, messages: List[Dict[str, str]], **kwargs) -> str:
        """
        Asynchronous method to handle chat-based interactions with the model.

        Args:
            messages: A list of messages, where each message is represented as a
                dictionary with `"role"` (e.g., `"user"`, `"system"`) and `"content"`
                (the text of the message).
            **kwargs: Additional parameters to configure the model's behavior during
                chat completion. This may include options such as:

                - model (`str`): The model to use (e.g., `"gpt-4o"`).
                - temperature (`float`): Amount of randomness injected into
                    the response.
                - max_completion_tokens (`int`): Maximum number of tokens to generate.
                - etc.

                For a complete list of supported parameters for each model, refer to the
                respective API documentation.

        Returns:
            A string containing the model's response to the chat messages.

        Raises:
            NotImplementedError: If called on the base class without an implementation.
        """
        raise NotImplementedError

    def chat(self, messages: List[Dict[str, str]], **kwargs) -> str:
        """
        Synchronous method to handle chat-based interactions with the model.

        Args:
            messages: A list of messages, where each message is represented as a
                dictionary with `"role"` (e.g., `"user"`, `"system"`) and `"content"`
                (the text of the message).
            **kwargs: Additional parameters to configure the model's behavior during
                chat completion. This may include options such as:

                - model (`str`): The model to use (e.g., `"gpt-4o"`).
                - temperature (`float`): Amount of randomness injected into
                    the response.
                - max_completion_tokens (`int`): Maximum number of tokens to generate.
                - etc.

                For a complete list of supported parameters for each model, refer to the
                respective API documentation.

        Returns:
            A string containing the model's response to the chat messages.

        Raises:
            NotImplementedError: If called on the base class without an implementation.
        """
        raise NotImplementedError

__init__(provider=None, **kwargs)

Initializes the ChatCompletionModel instance.

Parameters:

Name Type Description Default
provider str

The name of the model provider (e.g., "openai", "anthropic").

None
**kwargs

Recognized/expected keys are usage (a dictionary to track token usage and cost information) and any provider-specific configuration parameters.

{}
Source code in afnio/models/model.py
271
272
273
274
275
276
277
278
279
280
def __init__(self, provider: Optional[str] = None, **kwargs):
    """Initializes the `ChatCompletionModel` instance.

    Args:
        provider: The name of the model provider (e.g., `"openai"`, `"anthropic"`).
        **kwargs: Recognized/expected keys are `usage` (a dictionary to track token
            usage and cost information) and any provider-specific configuration
            parameters.
    """
    super().__init__(provider=provider, **kwargs)

achat(messages, **kwargs) async

Asynchronous method to handle chat-based interactions with the model.

Parameters:

Name Type Description Default
messages list[dict[str, str]]

A list of messages, where each message is represented as a dictionary with "role" (e.g., "user", "system") and "content" (the text of the message).

required
**kwargs

Additional parameters to configure the model's behavior during chat completion. This may include options such as:

  • model (str): The model to use (e.g., "gpt-4o").
  • temperature (float): Amount of randomness injected into the response.
  • max_completion_tokens (int): Maximum number of tokens to generate.
  • etc.

For a complete list of supported parameters for each model, refer to the respective API documentation.

{}

Returns:

Type Description
str

A string containing the model's response to the chat messages.

Source code in afnio/models/model.py
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
async def achat(self, messages: List[Dict[str, str]], **kwargs) -> str:
    """Run a chat-completion request against the model asynchronously.

    Subclasses must override this coroutine with a provider-specific
    implementation.

    Args:
        messages: Conversation history as a list of dictionaries, each
            carrying a `"role"` (e.g., `"user"`, `"system"`) and the
            message `"content"`.
        **kwargs: Provider-specific options controlling generation,
            for example:

            - model (`str`): The model to use (e.g., `"gpt-4o"`).
            - temperature (`float`): Amount of randomness injected into
                the response.
            - max_completion_tokens (`int`): Maximum number of tokens to generate.

            See the provider's API documentation for the full list of
            supported parameters.

    Returns:
        The model's textual response to the chat messages.

    Raises:
        NotImplementedError: Always, on this abstract base implementation.
    """
    raise NotImplementedError

chat(messages, **kwargs)

Synchronous method to handle chat-based interactions with the model.

Parameters:

Name Type Description Default
messages list[dict[str, str]]

A list of messages, where each message is represented as a dictionary with "role" (e.g., "user", "system") and "content" (the text of the message).

required
**kwargs

Additional parameters to configure the model's behavior during chat completion. This may include options such as:

  • model (str): The model to use (e.g., "gpt-4o").
  • temperature (float): Amount of randomness injected into the response.
  • max_completion_tokens (int): Maximum number of tokens to generate.
  • etc.

For a complete list of supported parameters for each model, refer to the respective API documentation.

{}

Returns:

Type Description
str

A string containing the model's response to the chat messages.

Source code in afnio/models/model.py
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
def chat(self, messages: List[Dict[str, str]], **kwargs) -> str:
    """
    Synchronous method to handle chat-based interactions with the model.

    Args:
        messages: Conversation history as a list of dictionaries, each carrying
            a `"role"` key (e.g., `"user"`, `"system"`) and a `"content"` key
            holding the message text.
        **kwargs: Provider-specific options controlling the chat completion,
            for example:

            - model (`str`): Which model to query (e.g., `"gpt-4o"`).
            - temperature (`float`): Degree of randomness in the output.
            - max_completion_tokens (`int`): Upper bound on generated tokens.
            - etc.

            See the respective provider's API documentation for the full set
            of supported parameters.

    Returns:
        The model's reply to the chat messages, as a string.

    Raises:
        NotImplementedError: Always; concrete subclasses must override this.
    """
    raise NotImplementedError

afnio.models.model.EmbeddingModel

Bases: BaseModel

An abstraction for a model that generates embeddings for input texts.

Source code in afnio/models/model.py
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
class EmbeddingModel(BaseModel):
    """
    An abstraction for a model that generates embeddings for input texts.
    """

    def __init__(self, provider: str = None, **kwargs):
        """Initializes the `EmbeddingModel` instance.

        Args:
            provider: The name of the model provider (e.g., `"openai"`, `"anthropic"`).
            **kwargs: Recognized/expected keys are `usage` (a dictionary to track token
                usage and cost information) and any provider-specific configuration
                parameters.
        """
        super().__init__(provider=provider, **kwargs)

    async def aembed(self, input: List[str], **kwargs) -> List[List[float]]:
        """
        Asynchronous method to generate embeddings for the given input texts.

        Args:
            input: A list of input strings for which embeddings should be generated.
            **kwargs: Additional parameters to configure the model's behavior during
                embedding generation. This may include options such as:

                - model (`str`): The embedding model to use
                    (e.g., `"text-embedding-3-small"`).
                - dimensions (`int`): The number of dimensions the resulting
                    embeddings should have.
                - etc.

                For a complete list of supported parameters for each model, refer to the
                respective API documentation.

        Returns:
            A list of embeddings, where each embedding is represented \
            as a list of floats corresponding to the input strings.

        Raises:
            NotImplementedError: Always; concrete subclasses must override this.
        """
        raise NotImplementedError

    def embed(self, input: List[str], **kwargs) -> List[List[float]]:
        """
        Synchronous method to generate embeddings for the given input texts.

        Args:
            input: A list of input strings for which embeddings should be generated.
            **kwargs: Additional parameters to configure the model's behavior during
                embedding generation. This may include options such as:

                - model (`str`): The embedding model to use
                    (e.g., `"text-embedding-3-small"`).
                - dimensions (`int`): The number of dimensions the resulting
                    embeddings should have.
                - etc.

                For a complete list of supported parameters for each model, refer to the
                respective API documentation.

        Returns:
            A list of embeddings, where each embedding is represented \
            as a list of floats corresponding to the input strings.

        Raises:
            NotImplementedError: Always; concrete subclasses must override this.
        """
        raise NotImplementedError

__init__(provider=None, **kwargs)

Initializes the EmbeddingModel instance.

Parameters:

Name Type Description Default
provider str

The name of the model provider (e.g., "openai", "anthropic").

None
**kwargs

Recognized/expected keys are usage (a dictionary to track token usage and cost information) and any provider-specific configuration parameters.

{}
Source code in afnio/models/model.py
340
341
342
343
344
345
346
347
348
349
def __init__(self, provider: str = None, **kwargs):
    """Initializes the `EmbeddingModel` instance.

    Args:
        provider: The name of the model provider (e.g., `"openai"`, `"anthropic"`).
        **kwargs: Recognized/expected keys are `usage` (a dictionary to track token
            usage and cost information) and any provider-specific configuration
            parameters.
    """
    super().__init__(provider=provider, **kwargs)

aembed(input, **kwargs) async

Asynchronous method to generate embeddings for the given input texts.

Parameters:

Name Type Description Default
input list[str]

A list of input strings for which embeddings should be generated.

required
**kwargs

Additional parameters to configure the model's behavior during embedding generation. This may include options such as:

  • model (str): The embedding model to use (e.g., "text-embedding-3-small").
  • dimensions (int): The number of dimensions the resulting embeddings should have.
  • etc.

For a complete list of supported parameters for each model, refer to the respective API documentation.

{}

Returns:

Type Description
list[list[float]]

A list of embeddings, where each embedding is represented as a list of floats corresponding to the input strings.

Source code in afnio/models/model.py
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
async def aembed(self, input: List[str], **kwargs) -> List[List[float]]:
    """
    Asynchronous method to generate embeddings for the given input texts.

    Args:
        input: A list of input strings for which embeddings should be generated.
        **kwargs: Additional parameters to configure the model's behavior during
            embedding generation. This may include options such as:

            - model (`str`): The embedding model to use
                (e.g., `"text-embedding-3-small"`).
            - dimensions (`int`): The number of dimensions the resulting
                embeddings should have.
            - etc.

            For a complete list of supported parameters for each model, refer to the
            respective API documentation.

    Returns:
        A list of embeddings, where each embedding is represented \
        as a list of floats corresponding to the input strings.

    Raises:
        NotImplementedError: Always; concrete subclasses must override this.
    """
    raise NotImplementedError

embed(input, **kwargs)

Synchronous method to generate embeddings for the given input texts.

Parameters:

Name Type Description Default
input list[str]

A list of input strings for which embeddings should be generated.

required
**kwargs

Additional parameters to configure the model's behavior during embedding generation. This may include options such as:

  • model (str): The embedding model to use (e.g., "text-embedding-3-small").
  • dimensions (int): The number of dimensions the resulting embeddings should have.
  • etc.

For a complete list of supported parameters for each model, refer to the respective API documentation.

{}

Returns:

Type Description
list[list[float]]

A list of embeddings, where each embedding is represented as a list of floats corresponding to the input strings.

Source code in afnio/models/model.py
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
def embed(self, input: List[str], **kwargs) -> List[List[float]]:
    """
    Synchronous method to generate embeddings for the given input texts.

    Args:
        input: A list of input strings for which embeddings should be generated.
        **kwargs: Additional parameters to configure the model's behavior during
            embedding generation. This may include options such as:

            - model (`str`): The embedding model to use
                (e.g., `"text-embedding-3-small"`).
            - dimensions (`int`): The number of dimensions the resulting
                embeddings should have.
            - etc.

            For a complete list of supported parameters for each model, refer to the
            respective API documentation.

    Returns:
        A list of embeddings, where each embedding is represented \
        as a list of floats corresponding to the input strings.

    Raises:
        NotImplementedError: Always; concrete subclasses must override this.
    """
    raise NotImplementedError