MultiUnify - Unify Documentation

class MultiUnify

source code

__init__

source code

def __init__(
        self,
        endpoints: Optional[Union[str, Iterable[str]]] = None,
        *,
        system_message: Optional[str] = None,
        messages: Optional[
            Union[
                List[ChatCompletionMessageParam],
                Dict[str, List[ChatCompletionMessageParam]],
            ]
        ] = None,
        frequency_penalty: Optional[float] = None,
        logit_bias: Optional[Dict[str, int]] = None,
        logprobs: Optional[bool] = None,
        top_logprobs: Optional[int] = None,
        max_completion_tokens: Optional[int] = None,
        n: Optional[int] = None,
        presence_penalty: Optional[float] = None,
        response_format: Optional[Union[Type[BaseModel], Dict[str, str]]] = None,
        seed: Optional[int] = None,
        stop: Union[Optional[str], List[str]] = None,
        temperature: Optional[float] = 1.0,
        top_p: Optional[float] = None,
        service_tier: Optional[str] = None,
        tools: Optional[Iterable[ChatCompletionToolParam]] = None,
        tool_choice: Optional[ChatCompletionToolChoiceOptionParam] = None,
        parallel_tool_calls: Optional[bool] = None,
        reasoning_effort: Optional[str] = None,
        # platform arguments
        use_custom_keys: bool = False,
        tags: Optional[List[str]] = None,
        drop_params: Optional[bool] = True,
        region: Optional[str] = None,
        log_query_body: Optional[bool] = True,
        log_response_body: Optional[bool] = True,
        api_key: Optional[str] = None,
        # python client arguments
        stateful: bool = False,
        return_full_completion: bool = False,
        traced: bool = False,
        direct_mode: bool = False,
        cache: Union[bool, str] = None,
        cache_backend: Optional[str] = None,
        # passthrough arguments
        extra_headers: Optional[Headers] = None,
        extra_query: Optional[Query] = None,
        **kwargs,
    ) -> None:

Initialize the Multi LLM Unify client. Arguments:

endpoints - A single endpoint name or a list of endpoint names, with each name
system_message - An optional string containing the system message. This
messages - A list of messages comprising the conversation so far. This will
frequency_penalty - Number between -2.0 and 2.0. Positive values penalize new
logit_bias - Modify the likelihood of specified tokens appearing in the
logprobs - Whether to return log probabilities of the output tokens or not.
top_logprobs - An integer between 0 and 20 specifying the number of most
max_completion_tokens - The maximum number of tokens that can be generated in
n - How many chat completion choices to generate for each input message. Note
presence_penalty - Number between -2.0 and 2.0. Positive values penalize new
response_format - An object specifying the format that the model must output.
seed - If specified, a best effort attempt is made to sample
stop - Up to 4 sequences where the API will stop generating further tokens.
temperature - What sampling temperature to use, between 0 and 2.
top_p - An alternative to sampling with temperature, called nucleus sampling,
tools - A list of tools the model may call. Currently, only functions are
tool_choice - Controls which (if any) tool is called by the
parallel_tool_calls - Whether to enable parallel function calling during tool
use_custom_keys - Whether to use custom API keys or our unified API keys
tags - Arbitrary number of tags to classify this API query as needed. Helpful
drop_params - Whether or not to drop unsupported OpenAI params by the
region - A string used to represent the region where the endpoint is
log_query_body - Whether to log the contents of the query json body.
log_response_body - Whether to log the contents of the response json body.
stateful - Whether the conversation history is preserved within the messages
return_full_completion - If False, only return the message content
traced - Whether to trace the generate method.
cache - If True, then the arguments will be stored in a local cache file, and
extra_headers - Additional “passthrough” headers for the request which are
extra_query - Additional “passthrough” query parameters for the request which
kwargs - Additional “passthrough” JSON properties for the body of the

Raises:

UnifyError: If the API key is missing.

properties

cache

source code

def cache(self) -> bool:

Get the default cache bool. Returns: The default cache bool.

clients

source code

def clients(self) -> Dict[str, _UniClient]:

Get the current dictionary of clients, with endpoint names as keys and Unify or AsyncUnify instances as values. Returns: The dictionary of clients.

drop_params

source code

def drop_params(self) -> Optional[bool]:

Get the default drop_params bool, if set. Returns: The default drop_params bool.

endpoints

source code

def endpoints(self) -> Tuple[str, ...]:

Get the current tuple of endpoints. Returns: The tuple of endpoints.

extra_body

source code

def extra_body(self) -> Optional[Mapping[str, str]]:

Get the default extra body, if set. Returns: The default extra body.

extra_headers

source code

def extra_headers(self) -> Optional[Headers]:

Get the default extra headers, if set. Returns: The default extra headers.

extra_query

source code

def extra_query(self) -> Optional[Query]:

Get the default extra query, if set. Returns: The default extra query.

frequency_penalty

source code

def frequency_penalty(self) -> Optional[float]:

Get the default frequency penalty, if set. Returns: The default frequency penalty.

log_query_body

source code

def log_query_body(self) -> Optional[bool]:

Get the default log query body bool, if set. Returns: The default log query body bool.

log_response_body

source code

def log_response_body(self) -> Optional[bool]:

Get the default log response body bool, if set. Returns: The default log response body bool.

logit_bias

source code

def logit_bias(self) -> Optional[Dict[str, int]]:

Get the default logit bias, if set. Returns: The default logit bias.

logprobs

source code

def logprobs(self) -> Optional[bool]:

Get the default logprobs, if set. Returns: The default logprobs.

max_completion_tokens

source code

def max_completion_tokens(self) -> Optional[int]:

Get the default max completion tokens, if set. Returns: The default max completion tokens.

messages

source code

def messages(
        self,
    ) -> Optional[
        Union[
            List[ChatCompletionMessageParam],
            Dict[str, List[ChatCompletionMessageParam]],
        ]
    ]:

Get the default messages, if set. Returns: The default messages.

n

source code

def n(self) -> Optional[int]:

Get the default n, if set. Returns: The default n value.

parallel_tool_calls

source code

def parallel_tool_calls(self) -> Optional[bool]:

Get the default parallel tool calls bool, if set. Returns: The default parallel tool calls bool.

presence_penalty

source code

def presence_penalty(self) -> Optional[float]:

Get the default presence penalty, if set. Returns: The default presence penalty.

reasoning_effort

source code

def reasoning_effort(self) -> Optional[str]:

Get the default reasoning effort, if set. Returns: The default reasoning effort.

region

source code

def region(self) -> Optional[str]:

Get the default region, if set. Returns: The default region.

response_format

source code

def response_format(self) -> Optional[Union[Type[BaseModel], Dict[str, str]]]:

Get the default response format, if set. Returns: The default response format.

return_full_completion

source code

def return_full_completion(self) -> bool:

Get the default return full completion bool. Returns: The default return full completion bool.

seed

source code

def seed(self) -> Optional[int]:

Get the default seed value, if set. Returns: The default seed value.

service_tier

source code

def service_tier(self) -> Optional[str]:

Get the default service tier, if set. Returns: The default service tier.

stateful

source code

def stateful(self) -> bool:

Get the default stateful bool, if set. Returns: The default stateful bool.

stop

source code

def stop(self) -> Union[Optional[str], List[str]]:

Get the default stop value, if set. Returns: The default stop value.

stream

source code

def stream(self) -> Optional[bool]:

Get the default stream bool, if set. Returns: The default stream bool.

stream_options

source code

def stream_options(self) -> Optional[ChatCompletionStreamOptionsParam]:

Get the default stream options, if set. Returns: The default stream options.

system_message

source code

def system_message(self) -> Optional[str]:

Get the default system message, if set. Returns: The default system message.

temperature

source code

def temperature(self) -> Optional[float]:

Get the default temperature, if set. Returns: The default temperature.

tool_choice

source code

def tool_choice(self) -> Optional[ChatCompletionToolChoiceOptionParam]:

Get the default tool choice, if set. Returns: The default tool choice.

tools

source code

def tools(self) -> Optional[Iterable[ChatCompletionToolParam]]:

Get the default tools, if set. Returns: The default tools.

top_logprobs

source code

def top_logprobs(self) -> Optional[int]:

Get the default top logprobs, if set. Returns: The default top logprobs.

top_p

source code

def top_p(self) -> Optional[float]:

Get the default top p value, if set. Returns: The default top p value.

traced

source code

def traced(self) -> bool:

Get the default traced bool. Returns: The default traced bool.

use_custom_keys

source code

def use_custom_keys(self) -> bool:

Get the default use custom keys bool, if set. Returns: The default use custom keys bool.

setters

set_cache

source code

def set_cache(self, value: bool) -> Self:

Set the default cache bool. Arguments:

value - The default cache bool.

Returns: This client, useful for chaining inplace calls.

set_cache_backend

source code

def set_cache_backend(self, value: str) -> Self:

Set the default cache backend. Arguments:

value - The default cache backend.

Returns: This client, useful for chaining inplace calls.

set_direct_mode

source code

def set_direct_mode(self, value: bool) -> Self:

Set the default direct mode bool. Arguments:

value - The default direct mode bool.

Returns: This client, useful for chaining inplace calls.

set_drop_params

source code

def set_drop_params(self, value: bool) -> Self:

Set the default drop params bool. Arguments:

value - The default drop params bool.

Returns: This client, useful for chaining inplace calls.

set_extra_body

source code

def set_extra_body(self, value: Body) -> Self:

Set the default extra body. Arguments:

value - The default extra body.

Returns: This client, useful for chaining inplace calls.

set_extra_headers

source code

def set_extra_headers(self, value: Headers) -> Self:

Set the default extra headers. Arguments:

value - The default extra headers.

Returns: This client, useful for chaining inplace calls.

set_extra_query

source code

def set_extra_query(self, value: Query) -> Self:

Set the default extra query. Arguments:

value - The default extra query.

Returns: This client, useful for chaining inplace calls.

set_frequency_penalty

source code

def set_frequency_penalty(self, value: float) -> Self:

Set the default frequency penalty. Arguments:

value - The default frequency penalty.

Returns: This client, useful for chaining inplace calls.

set_log_query_body

source code

def set_log_query_body(self, value: bool) -> Self:

Set the default log query body bool. Arguments:

value - The default log query body bool.

Returns: This client, useful for chaining inplace calls.

set_log_response_body

source code

def set_log_response_body(self, value: bool) -> Self:

Set the default log response body bool. Arguments:

value - The default log response body bool.

Returns: This client, useful for chaining inplace calls.

set_logit_bias

source code

def set_logit_bias(self, value: Dict[str, int]) -> Self:

Set the default logit bias. Arguments:

value - The default logit bias.

Returns: This client, useful for chaining inplace calls.

set_logprobs

source code

def set_logprobs(self, value: bool) -> Self:

Set the default logprobs. Arguments:

value - The default logprobs.

Returns: This client, useful for chaining inplace calls.

set_max_completion_tokens

source code

def set_max_completion_tokens(self, value: int) -> Self:

Set the default max completion tokens. Arguments:

value - The default max completion tokens.

Returns: This client, useful for chaining inplace calls.

set_messages

source code

def set_messages(
        self,
        value: Union[
            List[ChatCompletionMessageParam],
            Dict[str, List[ChatCompletionMessageParam]],
        ],
    ) -> Self:

Set the default messages. Arguments:

value - The default messages.

Returns: This client, useful for chaining inplace calls.

set_n

source code

def set_n(self, value: int) -> Self:

Set the default n value. Arguments:

value - The default n value.

Returns: This client, useful for chaining inplace calls.

set_parallel_tool_calls

source code

def set_parallel_tool_calls(self, value: bool) -> Self:

Set the default parallel tool calls bool. Arguments:

value - The default parallel tool calls bool.

Returns: This client, useful for chaining inplace calls.

set_presence_penalty

source code

def set_presence_penalty(self, value: float) -> Self:

Set the default presence penalty. Arguments:

value - The default presence penalty.

Returns: This client, useful for chaining inplace calls.

set_reasoning_effort

source code

def set_reasoning_effort(self, value: str) -> Self:

Set the default reasoning effort. Arguments:

value - The default reasoning effort.

Returns: This client, useful for chaining inplace calls.

set_region

source code

def set_region(self, value: str) -> Self:

Set the default region. Arguments:

value - The default region.

Returns: This client, useful for chaining inplace calls.

set_response_format

source code

def set_response_format(
        self,
        value: Optional[Union[Type[BaseModel], Dict[str, str]]],
    ) -> Self:

Set the default response format. Arguments:

value - The default response format.

Returns: This client, useful for chaining inplace calls.

set_return_full_completion

source code

def set_return_full_completion(self, value: bool) -> Self:

Set the default return full completion bool. Arguments:

value - The default return full completion bool.

Returns: This client, useful for chaining inplace calls.

set_seed

source code

def set_seed(self, value: Optional[int]) -> Self:

Set the default seed value. Arguments:

value - The default seed value.

Returns: This client, useful for chaining inplace calls.

set_service_tier

source code

def set_service_tier(self, value: Optional[str]) -> Self:

Set the default service tier. Arguments:

value - The default service tier.

Returns: This client, useful for chaining inplace calls.

set_stateful

source code

def set_stateful(self, value: bool) -> Self:

Set the default stateful bool. Arguments:

value - The default stateful bool.

Returns: This client, useful for chaining inplace calls.

set_stop

source code

def set_stop(self, value: Union[str, List[str]]) -> Self:

Set the default stop value. Arguments:

value - The default stop value.

Returns: This client, useful for chaining inplace calls.

set_stream

source code

def set_stream(self, value: bool) -> Self:

Set the default stream bool. Arguments:

value - The default stream bool.

Returns: This client, useful for chaining inplace calls.

set_stream_options

source code

def set_stream_options(self, value: ChatCompletionStreamOptionsParam) -> Self:

Set the default stream options. Arguments:

value - The default stream options.

Returns: This client, useful for chaining inplace calls.

set_system_message

source code

def set_system_message(self, value: str) -> Self:

Set the default system message. Arguments:

value - The default system message.

Returns: This client, useful for chaining inplace calls.

set_tags

source code

def set_tags(self, value: List[str]) -> Self:

Set the default tags. Arguments:

value - The default tags.

Returns: This client, useful for chaining inplace calls.

set_temperature

source code

def set_temperature(self, value: float) -> Self:

Set the default temperature. Arguments:

value - The default temperature.

Returns: This client, useful for chaining inplace calls.

set_tool_choice

source code

def set_tool_choice(self, value: ChatCompletionToolChoiceOptionParam) -> Self:

Set the default tool choice. Arguments:

value - The default tool choice.

Returns: This client, useful for chaining inplace calls.

set_tools

source code

def set_tools(self, value: Iterable[ChatCompletionToolParam]) -> Self:

Set the default tools. Arguments:

value - The default tools.

Returns: This client, useful for chaining inplace calls.

set_top_logprobs

source code

def set_top_logprobs(self, value: int) -> Self:

Set the default top logprobs. Arguments:

value - The default top logprobs.

Returns: This client, useful for chaining inplace calls.

set_top_p

source code

def set_top_p(self, value: float) -> Self:

Set the default top p value. Arguments:

value - The default top p value.

Returns: This client, useful for chaining inplace calls.

set_traced

source code

def set_traced(self, value: bool) -> Self:

Set the default traced bool. Arguments:

value - The default traced bool.

Returns: This client, useful for chaining inplace calls.

set_use_custom_keys

source code

def set_use_custom_keys(self, value: bool) -> Self:

Set the default use custom keys bool. Arguments:

value - The default use custom keys bool.

Returns: This client, useful for chaining inplace calls.

methods

add_endpoints

source code

def add_endpoints(
        self,
        endpoints: Union[List[str], str],
        ignore_duplicates: bool = True,
    ) -> Self:

Add extra endpoints to be queried for each call to generate. Arguments:

endpoints - The extra endpoints to add.
ignore_duplicates - Whether or not to ignore duplicate endpoints passed.

Returns: This client, useful for chaining inplace calls.

append_messages

source code

def append_messages(
        self,
        value: Union[
            List[ChatCompletionMessageParam],
            Dict[str, List[ChatCompletionMessageParam]],
        ],
    ) -> Self:

Append to the default messages. Arguments:

value - The messages to append to the default.

Returns: This client, useful for chaining inplace calls.

copy

source code

def copy(self):

generate

source code

def generate(
        self,
        arg0: Optional[Union[str, List[Union[str, Tuple[Any], Dict[str, Any]]]]] = None,
        /,
        system_message: Optional[str] = None,
        messages: Optional[
            Union[
                List[ChatCompletionMessageParam],
                Dict[str, List[ChatCompletionMessageParam]],
            ]
        ] = None,
        *,
        frequency_penalty: Optional[float] = None,
        logit_bias: Optional[Dict[str, int]] = None,
        logprobs: Optional[bool] = None,
        top_logprobs: Optional[int] = None,
        max_completion_tokens: Optional[int] = None,
        n: Optional[int] = None,
        presence_penalty: Optional[float] = None,
        response_format: Optional[Union[Type[BaseModel], Dict[str, str]]] = None,
        seed: Optional[int] = None,
        stop: Union[Optional[str], List[str]] = None,
        stream: Optional[bool] = None,
        stream_options: Optional[ChatCompletionStreamOptionsParam] = None,
        temperature: Optional[float] = None,
        top_p: Optional[float] = None,
        tools: Optional[Iterable[ChatCompletionToolParam]] = None,
        tool_choice: Optional[ChatCompletionToolChoiceOptionParam] = None,
        parallel_tool_calls: Optional[bool] = None,
        reasoning_effort: Optional[str] = None,
        # platform arguments
        use_custom_keys: Optional[bool] = None,
        tags: Optional[List[str]] = None,
        drop_params: Optional[bool] = None,
        region: Optional[str] = None,
        log_query_body: Optional[bool] = None,
        log_response_body: Optional[bool] = None,
        # python client arguments
        stateful: Optional[bool] = None,
        return_full_completion: Optional[bool] = None,
        cache: Optional[Union[bool, str]] = None,
        # passthrough arguments
        extra_headers: Optional[Headers] = None,
        extra_query: Optional[Query] = None,
        **kwargs,
    ):

Generate a ChatCompletion response for each of the specified endpoints, from the provided query parameters. Arguments:

arg0 - A string containing the user message, or a list containing the inputs
system_message - An optional string containing the system message. This
messages - A list of messages comprising the conversation so far, or
frequency_penalty - Number between -2.0 and 2.0. Positive values penalize new
logit_bias - Modify the likelihood of specified tokens appearing in the
logprobs - Whether to return log probabilities of the output tokens or not.
top_logprobs - An integer between 0 and 20 specifying the number of most
max_completion_tokens - The maximum number of tokens that can be generated in
n - How many chat completion choices to generate for each input message. Note
presence_penalty - Number between -2.0 and 2.0. Positive values penalize new
response_format - An object specifying the format that the model must output.
seed - If specified, a best effort attempt is made to sample
stop - Up to 4 sequences where the API will stop generating further tokens.
stream - If True, generates content as a stream. If False, generates content
stream_options - Options for streaming response. Only set this when you set stream: true.
temperature - What sampling temperature to use, between 0 and 2.
top_p - An alternative to sampling with temperature, called nucleus sampling,
tools - A list of tools the model may call. Currently, only functions are
tool_choice - Controls which (if any) tool is called by the
parallel_tool_calls - Whether to enable parallel function calling during tool
stateful - Whether the conversation history is preserved within the messages
use_custom_keys - Whether to use custom API keys or our unified API keys
tags - Arbitrary number of tags to classify this API query as needed. Helpful
drop_params - Whether or not to drop unsupported OpenAI params by the
region - A string used to represent the region where the endpoint is
log_query_body - Whether to log the contents of the query json body.
log_response_body - Whether to log the contents of the response json body.
stateful - Whether the conversation history is preserved within the messages
return_full_completion - If False, only return the message content
cache - If True, then the arguments will be stored in a local cache file, and
extra_headers - Additional “passthrough” headers for the request which are
extra_query - Additional “passthrough” query parameters for the request which
kwargs - Additional “passthrough” JSON properties for the body of the

Returns: If stream is True, returns a generator yielding chunks of content. If stream is False, returns a single string response. Raises:

UnifyError: If an error occurs during content generation.

get_credit_balance

source code

def get_credit_balance(self) -> Union[float, None]:

Get the remaining credits left on your account. Returns: The remaining credits on the account if successful, otherwise None. Raises:

BadRequestError - If there was an HTTP error.
ValueError - If there was an error parsing the JSON response.

json

source code

def json(self):

remove_endpoints

source code

def remove_endpoints(
        self,
        endpoints: Union[List[str], str],
        ignore_missing: bool = True,
    ) -> Self:

Remove endpoints from the current list, which are queried for each call to generate. Arguments:

endpoints - The endpoints to remove.
ignore_missing - Whether or not to ignore endpoints passed which are not present in the current list.

Returns: This client, useful for chaining inplace calls.

reset_all

source code

def reset_all(self) -> Self:

Reset base client properties to their default values. Returns: This client, useful for chaining inplace calls.

reset_frequency_penalty

source code

def reset_frequency_penalty(self) -> Self:

Reset the frequency penalty to its default value. Returns: This client, useful for chaining inplace calls.

reset_logit_bias

source code

def reset_logit_bias(self) -> Self:

Reset the logit bias to its default value. Returns: This client, useful for chaining inplace calls.

reset_logprobs

source code

def reset_logprobs(self) -> Self:

Reset the logprobs to its default value. Returns: This client, useful for chaining inplace calls.

reset_max_completion_tokens

source code

def reset_max_completion_tokens(self) -> Self:

Reset the max completion tokens to its default value. Returns: This client, useful for chaining inplace calls.

reset_messages

source code

def reset_messages(self) -> Self:

Reset the messages to their default value. Returns: This client, useful for chaining inplace calls.

reset_n

source code

def reset_n(self) -> Self:

Reset n to its default value. Returns: This client, useful for chaining inplace calls.

reset_parallel_tool_calls

source code

def reset_parallel_tool_calls(self) -> Self:

Reset the parallel tool calls to its default value. Returns: This client, useful for chaining inplace calls.

reset_presence_penalty

source code

def reset_presence_penalty(self) -> Self:

Reset the presence penalty to its default value. Returns: This client, useful for chaining inplace calls.

reset_reasoning_effort

source code

def reset_reasoning_effort(self) -> Self:

Reset the reasoning effort to its default value. Returns: This client, useful for chaining inplace calls.

reset_response_format

source code

def reset_response_format(self) -> Self:

Reset the response format to its default value. Returns: This client, useful for chaining inplace calls.

reset_seed

source code

def reset_seed(self) -> Self:

Reset the seed to its default value. Returns: This client, useful for chaining inplace calls.

reset_service_tier

source code

def reset_service_tier(self) -> Self:

Reset the service tier to its default value. Returns: This client, useful for chaining inplace calls.

reset_stop

source code

def reset_stop(self) -> Self:

Reset the stop value to its default value. Returns: This client, useful for chaining inplace calls.

reset_stream

source code

def reset_stream(self) -> Self:

Reset the stream value to its default value. Returns: This client, useful for chaining inplace calls.

reset_stream_options

source code

def reset_stream_options(self) -> Self:

Reset the stream options to their default value. Returns: This client, useful for chaining inplace calls.

reset_system_message

source code

def reset_system_message(self) -> Self:

Reset the system message to its default value. Returns: This client, useful for chaining inplace calls.

reset_temperature

source code

def reset_temperature(self) -> Self:

Reset the temperature to its default value. Returns: This client, useful for chaining inplace calls.

reset_tool_choice

source code

def reset_tool_choice(self) -> Self:

Reset the tool choice to its default value. Returns: This client, useful for chaining inplace calls.

reset_tools

source code

def reset_tools(self) -> Self:

Reset the tools to their default value. Returns: This client, useful for chaining inplace calls.

reset_top_logprobs

source code

def reset_top_logprobs(self) -> Self:

Reset the top logprobs to its default value. Returns: This client, useful for chaining inplace calls.

reset_top_p

source code

def reset_top_p(self) -> Self:

Reset the top p value to its default value. Returns: This client, useful for chaining inplace calls.

to_async_client

source code

def to_async_client(self):

Return an asynchronous version of the client (AsyncMultiUnify instance), with the exact same configuration as this synchronous (MultiUnify) client. Returns: An AsyncMultiUnify instance with the same configuration as this MultiUnify instance.

dunder_methods

__repr__

source code

def __repr__(self):

__str__

source code

def __str__(self):

​__init__

​properties

​cache

​clients

​drop_params

​endpoints

​extra_body

​extra_headers

​extra_query

​frequency_penalty

​log_query_body

​log_response_body

​logit_bias

​logprobs

​max_completion_tokens

​messages

​n

​parallel_tool_calls

​presence_penalty

​reasoning_effort

​region

​response_format

​return_full_completion

​seed

​service_tier

​stateful

​stop

​stream

​stream_options

​system_message

​tags

​temperature

​tool_choice

​tools

​top_logprobs

​top_p

​traced

​use_custom_keys

​setters

​set_cache

​set_cache_backend

​set_direct_mode

​set_drop_params

​set_extra_body

​set_extra_headers

​set_extra_query

​set_frequency_penalty

​set_log_query_body

​set_log_response_body

​set_logit_bias

​set_logprobs

​set_max_completion_tokens

​set_messages

​set_n

​set_parallel_tool_calls

​set_presence_penalty

​set_reasoning_effort

​set_region

​set_response_format

​set_return_full_completion

​set_seed

​set_service_tier

​set_stateful

​set_stop

​set_stream

​set_stream_options

​set_system_message

​set_tags

​set_temperature

​set_tool_choice

​set_tools

​set_top_logprobs

​set_top_p

​set_traced

​set_use_custom_keys

​methods

​add_endpoints

​append_messages

​copy

​generate

init

properties

cache

clients

drop_params

endpoints

extra_body

extra_headers

extra_query

frequency_penalty

log_query_body

log_response_body

logit_bias

logprobs

max_completion_tokens

messages

n

parallel_tool_calls

presence_penalty

reasoning_effort

region

response_format

return_full_completion

seed

service_tier

stateful

stop

stream

stream_options

system_message

tags

temperature

tool_choice

tools

top_logprobs

top_p

traced

use_custom_keys

setters

set_cache

set_cache_backend

set_direct_mode

set_drop_params

set_extra_body

set_extra_headers

set_extra_query

set_frequency_penalty

set_log_query_body

set_log_response_body

set_logit_bias

set_logprobs

set_max_completion_tokens

set_messages

set_n

set_parallel_tool_calls

set_presence_penalty

set_reasoning_effort

set_region

set_response_format

set_return_full_completion

set_seed

set_service_tier

set_stateful

set_stop

set_stream

set_stream_options

set_system_message

set_tags

set_temperature

set_tool_choice

set_tools

set_top_logprobs

set_top_p

set_traced

set_use_custom_keys

methods

add_endpoints

append_messages

copy

generate