Source code for council.llm.base.providers.ollama.ollama_llm_configuration

from __future__ import annotations

from typing import Any, Dict, Final, List, Literal, Mapping, Optional, Tuple, Type, Union

from council.utils import Parameter, greater_than_validator, must_read_env_str, read_env_str, zero_to_one_validator

from ...llm_base import LLMConfigurationBase
from ...llm_config_object import LLMConfigSpec, LLMProviders

_env_var_prefix: Final[str] = "OLLAMA_"



[docs]
class OllamaLLMConfiguration(LLMConfigurationBase):

[docs]
    def __init__(self, model: str, keep_alive: Optional[Union[float, str]] = None, json_mode: bool = False) -> None:
        """
        Initialize a new instance

        Args:
            model (str): model name to use from https://ollama.com/library
            keep_alive (Optional[float | str]): ollama keep_alive parameter
            json_mode (bool): whenever to use json mode, default False
        """
        super().__init__()
        self._model = Parameter.string(name="model", required=True, value=model)
        keep_alive_value = keep_alive if keep_alive is None else str(keep_alive)
        self._keep_alive = Parameter.string(name="keep_alive", required=False, value=keep_alive_value)
        self._json_mode = Parameter.bool(name="json_mode", required=False, value=json_mode)

        # https://github.com/ollama/ollama/blob/main/docs/modelfile.md#valid-parameters-and-values
        self._mirostat = Parameter.int(name="mirostat", required=False)
        self._mirostat_eta = Parameter.float(name="mirostat_eta", required=False)
        self._mirostat_tau = Parameter.float(name="mirostat_tau", required=False)
        self._num_ctx = Parameter.int(name="num_ctx", required=False, validator=greater_than_validator(0))
        self._repeat_last_n = Parameter.int(name="repeat_last_n", required=False)
        self._repeat_penalty = Parameter.float(name="repeat_penalty", required=False)
        self._temperature = Parameter.float(
            name="temperature", required=False, default=0.0, validator=zero_to_one_validator
        )
        self._seed = Parameter.int(name="seed", required=False)
        self._stop = Parameter.string(name="stop", required=False)
        self._tfs_z = Parameter.float(name="tfs_z", required=False)
        self._num_predict = Parameter.int(name="num_predict", required=False)
        self._top_p = Parameter.float(name="top_p", required=False, validator=zero_to_one_validator)
        self._top_k = Parameter.int(name="top_k", required=False, validator=greater_than_validator(0))
        self._min_p = Parameter.float(name="min_p", required=False)


    def model_name(self) -> str:
        return self._model.unwrap()

    @property
    def model(self) -> Parameter[str]:
        """Ollama model."""
        return self._model

    @property
    def keep_alive(self) -> Parameter[str]:
        """
        Number of seconds / duration string to keep model in memory.
        See https://github.com/ollama/ollama/blob/main/docs/faq.md#how-do-i-keep-a-model-loaded-in-memory-or-make-it-unload-immediately
        """
        return self._keep_alive

    @property
    def keep_alive_value(self) -> Optional[Union[float, str]]:
        """Convert keep_alive parameter to a format expected by ollama."""
        keep_alive_value = self.keep_alive.value
        if keep_alive_value is None:
            return None

        try:
            return float(keep_alive_value)
        except ValueError:
            return keep_alive_value

    @property
    def json_mode(self) -> Parameter[bool]:
        """Whenever to return json. Will be converted into ollama format parameter."""
        return self._json_mode

    @property
    def format(self) -> Literal["", "json"]:
        """The format to return a response in."""
        return "" if not self.json_mode.value else "json"

    @property
    def mirostat(self) -> Parameter[int]:
        """Enable Mirostat sampling for controlling perplexity."""
        return self._mirostat

    @property
    def mirostat_eta(self) -> Parameter[float]:
        """Learning rate for Mirostat sampling."""
        return self._mirostat_eta

    @property
    def mirostat_tau(self) -> Parameter[float]:
        """Controls balance between coherence and diversity."""
        return self._mirostat_tau

    @property
    def num_ctx(self) -> Parameter[int]:
        """Context window size."""
        return self._num_ctx

    @property
    def repeat_last_n(self) -> Parameter[int]:
        """Look back size for repetition prevention."""
        return self._repeat_last_n

    @property
    def repeat_penalty(self) -> Parameter[float]:
        """Penalty for repetition."""
        return self._repeat_penalty

    @property
    def temperature(self) -> Parameter[float]:
        """The temperature of the model."""
        return self._temperature

    @property
    def seed(self) -> Parameter[int]:
        """Random seed."""
        return self._seed

    @property
    def stop(self) -> Parameter[str]:
        """Stop sequence."""
        return self._stop

    @property
    def stop_value(self) -> Optional[List[str]]:
        """Format `stop` parameter. Only single value is supported currently."""
        return [self.stop.value] if self.stop.value is not None else None

    @property
    def tfs_z(self) -> Parameter[float]:
        """Tail free sampling parameter."""
        return self._tfs_z

    @property
    def num_predict(self) -> Parameter[int]:
        """Maximum number of tokens to predict."""
        return self._num_predict

    @property
    def top_k(self) -> Parameter[int]:
        """
        Only sample from the top K options for each subsequent token.
        Used to remove "long tail" low probability responses.
        """
        return self._top_k

    @property
    def top_p(self) -> Parameter[float]:
        """
        Use nucleus sampling.
        In nucleus sampling, we compute the cumulative distribution over all the options for each subsequent token in
        decreasing probability order and cut it off once it reaches a particular probability specified by top_p.
        """
        return self._top_p

    @property
    def min_p(self) -> Parameter[float]:
        """Minimum probability for token consideration"""
        return self._min_p


[docs]
    def params_to_options(self) -> Dict[str, Any]:
        """Convert parameters to options dict"""
        return {
            "mirostat": self.mirostat.value,
            "mirostat_eta": self.mirostat_eta.value,
            "mirostat_tau": self.mirostat_tau.value,
            "num_ctx": self.num_ctx.value,
            "repeat_last_n": self.repeat_last_n.value,
            "repeat_penalty": self.repeat_penalty.value,
            "temperature": self.temperature.value,
            "seed": self.seed.value,
            "stop": self.stop_value,
            "tfs_z": self.tfs_z.value,
            "num_predict": self.num_predict.value,
            "top_k": self.top_k.value,
            "top_p": self.top_p.value,
            "min_p": self.min_p.value,
        }


    @staticmethod
    def from_env() -> OllamaLLMConfiguration:
        model = must_read_env_str(_env_var_prefix + "LLM_MODEL")
        keep_alive = read_env_str(_env_var_prefix + "KEEP_ALIVE", required=False).as_optional()

        config = OllamaLLMConfiguration(model=model, keep_alive=keep_alive)
        return config

    @classmethod
    def from_spec(cls, spec: LLMConfigSpec) -> OllamaLLMConfiguration:
        spec.check_provider(LLMProviders.Ollama)

        model = spec.provider.must_get_value("model")
        config = OllamaLLMConfiguration(model=str(model))

        value = spec.provider.get_value("keep_alive")
        if value is not None:
            config.keep_alive.set(value)

        value = spec.provider.get_value("json_mode")
        if value is not None:
            config.json_mode.set(value)

        if spec.parameters is not None:
            param_mapping: Mapping[str, Tuple[Parameter, Type]] = {
                "mirostat": (config.mirostat, int),
                "mirostatEta": (config.mirostat_eta, float),
                "mirostatTau": (config.mirostat_tau, float),
                "numCtx": (config.num_ctx, int),
                "repeatLastN": (config.repeat_last_n, int),
                "repeatPenalty": (config.repeat_penalty, float),
                "temperature": (config.temperature, float),
                "seed": (config.seed, int),
                "stop": (config.stop, list),
                "tfsZ": (config.tfs_z, float),
                "numPredict": (config.num_predict, int),
                "topK": (config.top_k, int),
                "topP": (config.top_p, float),
                "minP": (config.min_p, float),
            }

            for key, (param, type_conv) in param_mapping.items():
                value = spec.parameters.get(key)
                if value is not None:
                    param.set(type_conv(value))

        return config