backends

Module to define the backends in charge of creating logits processors.

`BaseBackend`

Bases: ABC

Base class for all backends.

The subclasses must implement methods that create a logits processor from a JSON schema, regex or CFG.

Source code in outlines/backends/base.py

class BaseBackend(ABC):
    """Base class for all backends.

    The subclasses must implement methods that create a logits processor
    from a JSON schema, regex or CFG.

    """

    @abstractmethod
    def get_json_schema_logits_processor(
        self, json_schema: str
    ) -> LogitsProcessorType:
        """Create a logits processor from a JSON schema.

        Parameters
        ----------
        json_schema: str
            The JSON schema to create a logits processor from.

        Returns
        -------
        LogitsProcessorType
            The logits processor.

        """
        ...

    @abstractmethod
    def get_regex_logits_processor(self, regex: str) -> LogitsProcessorType:
        """Create a logits processor from a regex.

        Parameters
        ----------
        regex: str
            The regex to create a logits processor from.

        Returns
        -------
        LogitsProcessorType
            The logits processor.

        """
        ...

    @abstractmethod
    def get_cfg_logits_processor(self, grammar: str) -> LogitsProcessorType:
        """Create a logits processor from a context-free grammar.

        Parameters
        ----------
        grammar: str
            The context-free grammar to create a logits processor from.

        Returns
        -------
        LogitsProcessorType
            The logits processor.

        """
        ...

`get_cfg_logits_processor(grammar)` `abstractmethod`

Create a logits processor from a context-free grammar.

Parameters:

Name	Type	Description	Default
`grammar`	`str`	The context-free grammar to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessorType`	The logits processor.

Source code in outlines/backends/base.py

@abstractmethod
def get_cfg_logits_processor(self, grammar: str) -> LogitsProcessorType:
    """Create a logits processor from a context-free grammar.

    Parameters
    ----------
    grammar: str
        The context-free grammar to create a logits processor from.

    Returns
    -------
    LogitsProcessorType
        The logits processor.

    """
    ...

`get_json_schema_logits_processor(json_schema)` `abstractmethod`

Create a logits processor from a JSON schema.

Parameters:

Name	Type	Description	Default
`json_schema`	`str`	The JSON schema to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessorType`	The logits processor.

Source code in outlines/backends/base.py

@abstractmethod
def get_json_schema_logits_processor(
    self, json_schema: str
) -> LogitsProcessorType:
    """Create a logits processor from a JSON schema.

    Parameters
    ----------
    json_schema: str
        The JSON schema to create a logits processor from.

    Returns
    -------
    LogitsProcessorType
        The logits processor.

    """
    ...

`get_regex_logits_processor(regex)` `abstractmethod`

Create a logits processor from a regex.

Parameters:

Name	Type	Description	Default
`regex`	`str`	The regex to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessorType`	The logits processor.

Source code in outlines/backends/base.py

@abstractmethod
def get_regex_logits_processor(self, regex: str) -> LogitsProcessorType:
    """Create a logits processor from a regex.

    Parameters
    ----------
    regex: str
        The regex to create a logits processor from.

    Returns
    -------
    LogitsProcessorType
        The logits processor.

    """
    ...

`LLGuidanceBackend`

Bases: BaseBackend

Backend for LLGuidance.

Source code in outlines/backends/llguidance.py

class LLGuidanceBackend(BaseBackend):
    """Backend for LLGuidance."""

    def __init__(self, model: SteerableModel):
        """
        Parameters
        ----------
        model
            The Outlines model of the user.

        """
        import llguidance as llg

        self.llg = llg
        self.tensor_library_name = model.tensor_library_name
        self.llg_tokenizer = self._create_llg_tokenizer(model)

    def _create_llg_tokenizer(self, model: SteerableModel) -> "LLGTokenizer":
        """Create an llg tokenizer from the Outlines model's tokenizer.

        Parameters
        ----------
        model: Model
            The Outlines model.

        Returns
        -------
        LLGTokenizer
            The llg tokenizer.

        """
        if isinstance(model, Transformers):
            import llguidance.hf

            return llguidance.hf.from_tokenizer(model.hf_tokenizer)

        elif isinstance(model, LlamaCpp):
            import llama_cpp
            import llguidance.llamacpp

            vocab = llama_cpp.llama_model_get_vocab(model.model.model)
            return llguidance.llamacpp.lltokenizer_from_vocab(vocab)

        elif isinstance(model, MLXLM): # pragma: no cover
            import llguidance.hf

            return llguidance.hf.from_tokenizer(
                model.mlx_tokenizer._tokenizer
            )

        else: # pragma: no cover
            raise ValueError(
                f"Unsupported model type: {type(model)}. "
                "Llguidance only supports LlamaCpp, MLXLM "
                "and Transformers models."
            )

    def get_json_schema_logits_processor(
        self, json_schema: str
    ) -> LLGuidanceLogitsProcessor:
        """Create a logits processor from a JSON schema.

        Parameters
        ----------
        json_schema: str
            The JSON schema to create a logits processor from.

        Returns
        -------
        LogitsProcessor
            The logits processor to use to constrain the generation.

        """
        grammar_spec = self.llg.grammar_from("json_schema", json_schema)
        return LLGuidanceLogitsProcessor(
            grammar_spec, self.llg_tokenizer, self.tensor_library_name
        )

    def get_regex_logits_processor(
        self, regex: str
    ) -> LLGuidanceLogitsProcessor:
        """Create a logits processor from a regex.

        Parameters
        ----------
        regex: str
            The regex to create a logits processor from.

        Returns
        -------
        LogitsProcessor
            The logits processor to use to constrain the generation.

        """
        grammar_spec = self.llg.grammar_from("regex", regex)
        return LLGuidanceLogitsProcessor(
            grammar_spec, self.llg_tokenizer, self.tensor_library_name
        )

    def get_cfg_logits_processor(
        self, grammar: str
    ) -> LLGuidanceLogitsProcessor:
        """Create a logits processor from a context-free grammar.

        Parameters
        ----------
        grammar: str
            The context-free grammar to create a logits processor from.

        Returns
        -------
        LogitsProcessor
            The logits processor to use to constrain the generation.

        """
        # We try both lark and ebnf
        try:
            grammar_spec = self.llg.grammar_from("grammar", grammar)
        except ValueError:
            grammar_spec = self.llg.grammar_from("lark", grammar)
        return LLGuidanceLogitsProcessor(
            grammar_spec, self.llg_tokenizer, self.tensor_library_name
        )

`init(model)`

Parameters:

Name	Type	Description	Default
`model`	`SteerableModel`	The Outlines model of the user.	required

Source code in outlines/backends/llguidance.py

def __init__(self, model: SteerableModel):
    """
    Parameters
    ----------
    model
        The Outlines model of the user.

    """
    import llguidance as llg

    self.llg = llg
    self.tensor_library_name = model.tensor_library_name
    self.llg_tokenizer = self._create_llg_tokenizer(model)

`get_cfg_logits_processor(grammar)`

Create a logits processor from a context-free grammar.

Parameters:

Name	Type	Description	Default
`grammar`	`str`	The context-free grammar to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessor`	The logits processor to use to constrain the generation.

Source code in outlines/backends/llguidance.py

def get_cfg_logits_processor(
    self, grammar: str
) -> LLGuidanceLogitsProcessor:
    """Create a logits processor from a context-free grammar.

    Parameters
    ----------
    grammar: str
        The context-free grammar to create a logits processor from.

    Returns
    -------
    LogitsProcessor
        The logits processor to use to constrain the generation.

    """
    # We try both lark and ebnf
    try:
        grammar_spec = self.llg.grammar_from("grammar", grammar)
    except ValueError:
        grammar_spec = self.llg.grammar_from("lark", grammar)
    return LLGuidanceLogitsProcessor(
        grammar_spec, self.llg_tokenizer, self.tensor_library_name
    )

`get_json_schema_logits_processor(json_schema)`

Create a logits processor from a JSON schema.

Parameters:

Name	Type	Description	Default
`json_schema`	`str`	The JSON schema to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessor`	The logits processor to use to constrain the generation.

Source code in outlines/backends/llguidance.py

def get_json_schema_logits_processor(
    self, json_schema: str
) -> LLGuidanceLogitsProcessor:
    """Create a logits processor from a JSON schema.

    Parameters
    ----------
    json_schema: str
        The JSON schema to create a logits processor from.

    Returns
    -------
    LogitsProcessor
        The logits processor to use to constrain the generation.

    """
    grammar_spec = self.llg.grammar_from("json_schema", json_schema)
    return LLGuidanceLogitsProcessor(
        grammar_spec, self.llg_tokenizer, self.tensor_library_name
    )

`get_regex_logits_processor(regex)`

Create a logits processor from a regex.

Parameters:

Name	Type	Description	Default
`regex`	`str`	The regex to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessor`	The logits processor to use to constrain the generation.

Source code in outlines/backends/llguidance.py

def get_regex_logits_processor(
    self, regex: str
) -> LLGuidanceLogitsProcessor:
    """Create a logits processor from a regex.

    Parameters
    ----------
    regex: str
        The regex to create a logits processor from.

    Returns
    -------
    LogitsProcessor
        The logits processor to use to constrain the generation.

    """
    grammar_spec = self.llg.grammar_from("regex", regex)
    return LLGuidanceLogitsProcessor(
        grammar_spec, self.llg_tokenizer, self.tensor_library_name
    )

`OutlinesCoreBackend`

Bases: BaseBackend

Backend for Outlines Core.

Source code in outlines/backends/outlines_core.py

class OutlinesCoreBackend(BaseBackend):
    """Backend for Outlines Core."""

    def __init__(self, model: SteerableModel):
        """
        Parameters
        ----------
        model
            The Outlines model of the user.

        """
        if isinstance(model, Transformers):
            tokenizer = model.tokenizer
            vocabulary = tokenizer.get_vocab()
            eos_token_id = tokenizer.eos_token_id
            eos_token = tokenizer.eos_token
            token_to_str = tokenizer.convert_token_to_string
        elif isinstance(model, LlamaCpp):
            tokenizer = model.tokenizer # type: ignore
            vocabulary = tokenizer.vocabulary
            eos_token_id = tokenizer.eos_token_id
            eos_token = tokenizer.eos_token
            token_to_str = tokenizer.convert_token_to_string
        elif isinstance(model, MLXLM): # pragma: no cover
            tokenizer = model.mlx_tokenizer # type: ignore
            vocabulary = tokenizer.get_vocab()
            eos_token_id = tokenizer.eos_token_id
            eos_token = tokenizer.eos_token
            token_to_str = lambda token: tokenizer.convert_tokens_to_string([token]) # type: ignore
        else: # pragma: no cover
            raise ValueError(f"Unsupported model type: {type(model)}")

        self.eos_token_id = eos_token_id
        self.vocabulary = self.create_outlines_core_vocabulary(
            vocabulary, eos_token_id, eos_token, token_to_str
        )
        self.tensor_library_name = model.tensor_library_name

    def get_json_schema_logits_processor(
        self, json_schema: str
    ):
        """Create a logits processor from a JSON schema.

        Parameters
        ----------
        json_schema: str
            The JSON schema to create a logits processor from.

        Returns
        -------
        LogitsProcessor
            The logits processor to use to constrain the generation.

        """
        regex = outlines_core.json_schema.build_regex_from_schema(json_schema)
        return self.get_regex_logits_processor(regex)

    def get_regex_logits_processor(self, regex: str):
        """Create a logits processor from a regex.

        Parameters
        ----------
        regex: str
            The regex to create a logits processor from.

        Returns
        -------
        LogitsProcessor
            The logits processor to use to constrain the generation.

        """
        index = Index(regex, self.vocabulary)
        return OutlinesCoreLogitsProcessor(index, self.tensor_library_name)

    def get_cfg_logits_processor(self, grammar):
        raise NotImplementedError(
            "Outlines Core does not support context-free grammar."
        )

    @staticmethod
    def create_outlines_core_vocabulary(
        vocab: Dict[str, int],
        eos_token_id: int,
        eos_token: str,
        token_to_str: Callable[[str], str]
    ) -> Vocabulary:
        """Create an Outlines Core Vocabulary instance.

        Parameters
        ----------
        vocab: Dict[str, int]
            The vocabulary to create an Outlines Core vocabulary from.
        eos_token_id: int
            The EOS token ID.
        eos_token: str
            The EOS token.
        token_to_str: Callable[[str], str]
            The function to convert a token to a string.

        Returns
        -------
        Vocabulary
            The Outlines Core Vocabulary instance.

        """
        formatted_vocab = {}
        for token, token_id in vocab.items():
            # This step is necessary to transform special tokens into their
            # string representation, in particular for spacing. We need those
            # string representations as outlines core first builds an FSM from
            # the regex provided that only contains regular strings.
            token_as_str = token_to_str(token)
            formatted_vocab[token_as_str] = [token_id]
        formatted_vocab.pop(eos_token)
        return Vocabulary(eos_token_id, formatted_vocab)

`init(model)`

Parameters:

Name	Type	Description	Default
`model`	`SteerableModel`	The Outlines model of the user.	required

Source code in outlines/backends/outlines_core.py

def __init__(self, model: SteerableModel):
    """
    Parameters
    ----------
    model
        The Outlines model of the user.

    """
    if isinstance(model, Transformers):
        tokenizer = model.tokenizer
        vocabulary = tokenizer.get_vocab()
        eos_token_id = tokenizer.eos_token_id
        eos_token = tokenizer.eos_token
        token_to_str = tokenizer.convert_token_to_string
    elif isinstance(model, LlamaCpp):
        tokenizer = model.tokenizer # type: ignore
        vocabulary = tokenizer.vocabulary
        eos_token_id = tokenizer.eos_token_id
        eos_token = tokenizer.eos_token
        token_to_str = tokenizer.convert_token_to_string
    elif isinstance(model, MLXLM): # pragma: no cover
        tokenizer = model.mlx_tokenizer # type: ignore
        vocabulary = tokenizer.get_vocab()
        eos_token_id = tokenizer.eos_token_id
        eos_token = tokenizer.eos_token
        token_to_str = lambda token: tokenizer.convert_tokens_to_string([token]) # type: ignore
    else: # pragma: no cover
        raise ValueError(f"Unsupported model type: {type(model)}")

    self.eos_token_id = eos_token_id
    self.vocabulary = self.create_outlines_core_vocabulary(
        vocabulary, eos_token_id, eos_token, token_to_str
    )
    self.tensor_library_name = model.tensor_library_name

`create_outlines_core_vocabulary(vocab, eos_token_id, eos_token, token_to_str)` `staticmethod`

Create an Outlines Core Vocabulary instance.

Parameters:

Name	Type	Description	Default
`vocab`	`Dict[str, int]`	The vocabulary to create an Outlines Core vocabulary from.	required
`eos_token_id`	`int`	The EOS token ID.	required
`eos_token`	`str`	The EOS token.	required
`token_to_str`	`Callable[[str], str]`	The function to convert a token to a string.	required

Returns:

Type	Description
`Vocabulary`	The Outlines Core Vocabulary instance.

Source code in outlines/backends/outlines_core.py

@staticmethod
def create_outlines_core_vocabulary(
    vocab: Dict[str, int],
    eos_token_id: int,
    eos_token: str,
    token_to_str: Callable[[str], str]
) -> Vocabulary:
    """Create an Outlines Core Vocabulary instance.

    Parameters
    ----------
    vocab: Dict[str, int]
        The vocabulary to create an Outlines Core vocabulary from.
    eos_token_id: int
        The EOS token ID.
    eos_token: str
        The EOS token.
    token_to_str: Callable[[str], str]
        The function to convert a token to a string.

    Returns
    -------
    Vocabulary
        The Outlines Core Vocabulary instance.

    """
    formatted_vocab = {}
    for token, token_id in vocab.items():
        # This step is necessary to transform special tokens into their
        # string representation, in particular for spacing. We need those
        # string representations as outlines core first builds an FSM from
        # the regex provided that only contains regular strings.
        token_as_str = token_to_str(token)
        formatted_vocab[token_as_str] = [token_id]
    formatted_vocab.pop(eos_token)
    return Vocabulary(eos_token_id, formatted_vocab)

`get_json_schema_logits_processor(json_schema)`

Create a logits processor from a JSON schema.

Parameters:

Name	Type	Description	Default
`json_schema`	`str`	The JSON schema to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessor`	The logits processor to use to constrain the generation.

Source code in outlines/backends/outlines_core.py

def get_json_schema_logits_processor(
    self, json_schema: str
):
    """Create a logits processor from a JSON schema.

    Parameters
    ----------
    json_schema: str
        The JSON schema to create a logits processor from.

    Returns
    -------
    LogitsProcessor
        The logits processor to use to constrain the generation.

    """
    regex = outlines_core.json_schema.build_regex_from_schema(json_schema)
    return self.get_regex_logits_processor(regex)

`get_regex_logits_processor(regex)`

Create a logits processor from a regex.

Parameters:

Name	Type	Description	Default
`regex`	`str`	The regex to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessor`	The logits processor to use to constrain the generation.

Source code in outlines/backends/outlines_core.py

def get_regex_logits_processor(self, regex: str):
    """Create a logits processor from a regex.

    Parameters
    ----------
    regex: str
        The regex to create a logits processor from.

    Returns
    -------
    LogitsProcessor
        The logits processor to use to constrain the generation.

    """
    index = Index(regex, self.vocabulary)
    return OutlinesCoreLogitsProcessor(index, self.tensor_library_name)

`XGrammarBackend`

Bases: BaseBackend

Backend for XGrammar.

Source code in outlines/backends/xgrammar.py

class XGrammarBackend(BaseBackend):
    """Backend for XGrammar."""

    def __init__(self, model: SteerableModel):
        """
        Parameters
        ----------
        model
            The Outlines model of the user.

        """
        import xgrammar as xgr

        if isinstance(model, Transformers):
            tokenizer = model.hf_tokenizer
        elif isinstance(model, MLXLM): # pragma: no cover
            tokenizer = model.mlx_tokenizer._tokenizer
        else: # pragma: no cover
            raise ValueError(
                "The xgrammar backend only supports Transformers and "
                + "MLXLM models"
            )

        tokenizer_info = xgr.TokenizerInfo.from_huggingface(
            tokenizer,
            vocab_size=len(tokenizer.get_vocab())
        )
        self.grammar_compiler = xgr.GrammarCompiler(tokenizer_info)
        self.tensor_library_name = model.tensor_library_name

    def get_json_schema_logits_processor(
        self, json_schema: str
    ) -> XGrammarLogitsProcessor:
        """Create a logits processor from a JSON schema.

        Parameters
        ----------
        json_schema: str
            The JSON schema to create a logits processor from.

        Returns
        -------
        LogitsProcessor
            The logits processor to use to constrain the generation.

        """
        compiled_grammar = self.grammar_compiler.compile_json_schema(
            json_schema
        )
        return XGrammarLogitsProcessor(
            compiled_grammar,
            self.tensor_library_name
        )

    def get_regex_logits_processor(
        self, regex: str
    ) -> XGrammarLogitsProcessor:
        """Create a logits processor from a regex.

        Parameters
        ----------
        regex: str
            The regex to create a logits processor from.

        Returns
        -------
        LogitsProcessor
            The logits processor to use to constrain the generation.

        """
        compiled_grammar = self.grammar_compiler.compile_regex(regex)
        return XGrammarLogitsProcessor(
            compiled_grammar,
            self.tensor_library_name
        )

    def get_cfg_logits_processor(
        self, grammar: str
    ) -> XGrammarLogitsProcessor:
        """Create a logits processor from a context-free grammar.

        Parameters
        ----------
        grammar: str
            The context-free grammar to create a logits processor from.

        Returns
        -------
        LogitsProcessor
            The logits processor to use to constrain the generation.

        """
        compiled_grammar = self.grammar_compiler.compile_grammar(grammar)
        return XGrammarLogitsProcessor(
            compiled_grammar,
            self.tensor_library_name
        )

`init(model)`

Parameters:

Name	Type	Description	Default
`model`	`SteerableModel`	The Outlines model of the user.	required

Source code in outlines/backends/xgrammar.py

def __init__(self, model: SteerableModel):
    """
    Parameters
    ----------
    model
        The Outlines model of the user.

    """
    import xgrammar as xgr

    if isinstance(model, Transformers):
        tokenizer = model.hf_tokenizer
    elif isinstance(model, MLXLM): # pragma: no cover
        tokenizer = model.mlx_tokenizer._tokenizer
    else: # pragma: no cover
        raise ValueError(
            "The xgrammar backend only supports Transformers and "
            + "MLXLM models"
        )

    tokenizer_info = xgr.TokenizerInfo.from_huggingface(
        tokenizer,
        vocab_size=len(tokenizer.get_vocab())
    )
    self.grammar_compiler = xgr.GrammarCompiler(tokenizer_info)
    self.tensor_library_name = model.tensor_library_name

`get_cfg_logits_processor(grammar)`

Create a logits processor from a context-free grammar.

Parameters:

Name	Type	Description	Default
`grammar`	`str`	The context-free grammar to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessor`	The logits processor to use to constrain the generation.

Source code in outlines/backends/xgrammar.py

def get_cfg_logits_processor(
    self, grammar: str
) -> XGrammarLogitsProcessor:
    """Create a logits processor from a context-free grammar.

    Parameters
    ----------
    grammar: str
        The context-free grammar to create a logits processor from.

    Returns
    -------
    LogitsProcessor
        The logits processor to use to constrain the generation.

    """
    compiled_grammar = self.grammar_compiler.compile_grammar(grammar)
    return XGrammarLogitsProcessor(
        compiled_grammar,
        self.tensor_library_name
    )

`get_json_schema_logits_processor(json_schema)`

Create a logits processor from a JSON schema.

Parameters:

Name	Type	Description	Default
`json_schema`	`str`	The JSON schema to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessor`	The logits processor to use to constrain the generation.

Source code in outlines/backends/xgrammar.py

def get_json_schema_logits_processor(
    self, json_schema: str
) -> XGrammarLogitsProcessor:
    """Create a logits processor from a JSON schema.

    Parameters
    ----------
    json_schema: str
        The JSON schema to create a logits processor from.

    Returns
    -------
    LogitsProcessor
        The logits processor to use to constrain the generation.

    """
    compiled_grammar = self.grammar_compiler.compile_json_schema(
        json_schema
    )
    return XGrammarLogitsProcessor(
        compiled_grammar,
        self.tensor_library_name
    )

`get_regex_logits_processor(regex)`

Create a logits processor from a regex.

Parameters:

Name	Type	Description	Default
`regex`	`str`	The regex to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessor`	The logits processor to use to constrain the generation.

Source code in outlines/backends/xgrammar.py

def get_regex_logits_processor(
    self, regex: str
) -> XGrammarLogitsProcessor:
    """Create a logits processor from a regex.

    Parameters
    ----------
    regex: str
        The regex to create a logits processor from.

    Returns
    -------
    LogitsProcessor
        The logits processor to use to constrain the generation.

    """
    compiled_grammar = self.grammar_compiler.compile_regex(regex)
    return XGrammarLogitsProcessor(
        compiled_grammar,
        self.tensor_library_name
    )

`get_cfg_logits_processor(backend_name, model, grammar)`

Create a logits processor from a context-free grammar.

Parameters:

Name	Type	Description	Default
`backend_name`	`str \| None`	The name of the backend to use.	required
`model`	`SteerableModel`	The Outlines model of the user.	required
`grammar`	`str`	The context-free grammar to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessorType`	The logits processor.

Source code in outlines/backends/__init__.py

def get_cfg_logits_processor(
    backend_name: str | None,
    model: SteerableModel,
    grammar: str,
) -> LogitsProcessorType:
    """Create a logits processor from a context-free grammar.

    Parameters
    ----------
    backend_name: str | None
        The name of the backend to use.
    model: Model
        The Outlines model of the user.
    grammar: str
        The context-free grammar to create a logits processor from.

    Returns
    -------
    LogitsProcessorType
        The logits processor.

    """
    backend = _get_backend(
        backend_name or CFG_DEFAULT_BACKEND,
        model,
    )
    return backend.get_cfg_logits_processor(grammar)

`get_json_schema_logits_processor(backend_name, model, json_schema)`

Create a logits processor from a JSON schema.

Parameters:

Name	Type	Description	Default
`backend_name`	`str \| None`	The name of the backend to use.	required
`model`	`SteerableModel`	The Outlines model of the user.	required
`json_schema`	`str`	The JSON schema to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessorType`	The logits processor.

Source code in outlines/backends/__init__.py

def get_json_schema_logits_processor(
    backend_name: str | None,
    model: SteerableModel,
    json_schema: str,
) -> LogitsProcessorType:
    """Create a logits processor from a JSON schema.

    Parameters
    ----------
    backend_name: str | None
        The name of the backend to use.
    model: Model
        The Outlines model of the user.
    json_schema: str
        The JSON schema to create a logits processor from.

    Returns
    -------
    LogitsProcessorType
        The logits processor.

    """
    backend = _get_backend(
        backend_name or JSON_SCHEMA_DEFAULT_BACKEND,
        model,
    )
    return backend.get_json_schema_logits_processor(json_schema)

`get_regex_logits_processor(backend_name, model, regex)`

Create a logits processor from a regex.

Parameters:

Name	Type	Description	Default
`backend_name`	`str \| None`	The name of the backend to use.	required
`model`	`SteerableModel`	The Outlines model of the user.	required
`regex`	`str`	The regex to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessorType`	The logits processor.

Source code in outlines/backends/__init__.py

def get_regex_logits_processor(
    backend_name: str | None,
    model: SteerableModel,
    regex: str,
) -> LogitsProcessorType:
    """Create a logits processor from a regex.

    Parameters
    ----------
    backend_name: str | None
        The name of the backend to use.
    model: Model
        The Outlines model of the user.
    regex: str
        The regex to create a logits processor from.

    Returns
    -------
    LogitsProcessorType
        The logits processor.

    """
    backend = _get_backend(
        backend_name or REGEX_DEFAULT_BACKEND,
        model,
    )
    return backend.get_regex_logits_processor(regex)

`base`

Base class for all backends.

`BaseBackend`

Bases: ABC

Base class for all backends.

The subclasses must implement methods that create a logits processor from a JSON schema, regex or CFG.

Source code in outlines/backends/base.py

class BaseBackend(ABC):
    """Base class for all backends.

    The subclasses must implement methods that create a logits processor
    from a JSON schema, regex or CFG.

    """

    @abstractmethod
    def get_json_schema_logits_processor(
        self, json_schema: str
    ) -> LogitsProcessorType:
        """Create a logits processor from a JSON schema.

        Parameters
        ----------
        json_schema: str
            The JSON schema to create a logits processor from.

        Returns
        -------
        LogitsProcessorType
            The logits processor.

        """
        ...

    @abstractmethod
    def get_regex_logits_processor(self, regex: str) -> LogitsProcessorType:
        """Create a logits processor from a regex.

        Parameters
        ----------
        regex: str
            The regex to create a logits processor from.

        Returns
        -------
        LogitsProcessorType
            The logits processor.

        """
        ...

    @abstractmethod
    def get_cfg_logits_processor(self, grammar: str) -> LogitsProcessorType:
        """Create a logits processor from a context-free grammar.

        Parameters
        ----------
        grammar: str
            The context-free grammar to create a logits processor from.

        Returns
        -------
        LogitsProcessorType
            The logits processor.

        """
        ...

`get_cfg_logits_processor(grammar)` `abstractmethod`

Create a logits processor from a context-free grammar.

Parameters:

Name	Type	Description	Default
`grammar`	`str`	The context-free grammar to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessorType`	The logits processor.

Source code in outlines/backends/base.py

@abstractmethod
def get_cfg_logits_processor(self, grammar: str) -> LogitsProcessorType:
    """Create a logits processor from a context-free grammar.

    Parameters
    ----------
    grammar: str
        The context-free grammar to create a logits processor from.

    Returns
    -------
    LogitsProcessorType
        The logits processor.

    """
    ...

`get_json_schema_logits_processor(json_schema)` `abstractmethod`

Create a logits processor from a JSON schema.

Parameters:

Name	Type	Description	Default
`json_schema`	`str`	The JSON schema to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessorType`	The logits processor.

Source code in outlines/backends/base.py

@abstractmethod
def get_json_schema_logits_processor(
    self, json_schema: str
) -> LogitsProcessorType:
    """Create a logits processor from a JSON schema.

    Parameters
    ----------
    json_schema: str
        The JSON schema to create a logits processor from.

    Returns
    -------
    LogitsProcessorType
        The logits processor.

    """
    ...

`get_regex_logits_processor(regex)` `abstractmethod`

Create a logits processor from a regex.

Parameters:

Name	Type	Description	Default
`regex`	`str`	The regex to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessorType`	The logits processor.

Source code in outlines/backends/base.py

@abstractmethod
def get_regex_logits_processor(self, regex: str) -> LogitsProcessorType:
    """Create a logits processor from a regex.

    Parameters
    ----------
    regex: str
        The regex to create a logits processor from.

    Returns
    -------
    LogitsProcessorType
        The logits processor.

    """
    ...

`llguidance`

Backend class for LLGuidance.

`LLGuidanceBackend`

Bases: BaseBackend

Backend for LLGuidance.

Source code in outlines/backends/llguidance.py

class LLGuidanceBackend(BaseBackend):
    """Backend for LLGuidance."""

    def __init__(self, model: SteerableModel):
        """
        Parameters
        ----------
        model
            The Outlines model of the user.

        """
        import llguidance as llg

        self.llg = llg
        self.tensor_library_name = model.tensor_library_name
        self.llg_tokenizer = self._create_llg_tokenizer(model)

    def _create_llg_tokenizer(self, model: SteerableModel) -> "LLGTokenizer":
        """Create an llg tokenizer from the Outlines model's tokenizer.

        Parameters
        ----------
        model: Model
            The Outlines model.

        Returns
        -------
        LLGTokenizer
            The llg tokenizer.

        """
        if isinstance(model, Transformers):
            import llguidance.hf

            return llguidance.hf.from_tokenizer(model.hf_tokenizer)

        elif isinstance(model, LlamaCpp):
            import llama_cpp
            import llguidance.llamacpp

            vocab = llama_cpp.llama_model_get_vocab(model.model.model)
            return llguidance.llamacpp.lltokenizer_from_vocab(vocab)

        elif isinstance(model, MLXLM): # pragma: no cover
            import llguidance.hf

            return llguidance.hf.from_tokenizer(
                model.mlx_tokenizer._tokenizer
            )

        else: # pragma: no cover
            raise ValueError(
                f"Unsupported model type: {type(model)}. "
                "Llguidance only supports LlamaCpp, MLXLM "
                "and Transformers models."
            )

    def get_json_schema_logits_processor(
        self, json_schema: str
    ) -> LLGuidanceLogitsProcessor:
        """Create a logits processor from a JSON schema.

        Parameters
        ----------
        json_schema: str
            The JSON schema to create a logits processor from.

        Returns
        -------
        LogitsProcessor
            The logits processor to use to constrain the generation.

        """
        grammar_spec = self.llg.grammar_from("json_schema", json_schema)
        return LLGuidanceLogitsProcessor(
            grammar_spec, self.llg_tokenizer, self.tensor_library_name
        )

    def get_regex_logits_processor(
        self, regex: str
    ) -> LLGuidanceLogitsProcessor:
        """Create a logits processor from a regex.

        Parameters
        ----------
        regex: str
            The regex to create a logits processor from.

        Returns
        -------
        LogitsProcessor
            The logits processor to use to constrain the generation.

        """
        grammar_spec = self.llg.grammar_from("regex", regex)
        return LLGuidanceLogitsProcessor(
            grammar_spec, self.llg_tokenizer, self.tensor_library_name
        )

    def get_cfg_logits_processor(
        self, grammar: str
    ) -> LLGuidanceLogitsProcessor:
        """Create a logits processor from a context-free grammar.

        Parameters
        ----------
        grammar: str
            The context-free grammar to create a logits processor from.

        Returns
        -------
        LogitsProcessor
            The logits processor to use to constrain the generation.

        """
        # We try both lark and ebnf
        try:
            grammar_spec = self.llg.grammar_from("grammar", grammar)
        except ValueError:
            grammar_spec = self.llg.grammar_from("lark", grammar)
        return LLGuidanceLogitsProcessor(
            grammar_spec, self.llg_tokenizer, self.tensor_library_name
        )

`init(model)`

Parameters:

Name	Type	Description	Default
`model`	`SteerableModel`	The Outlines model of the user.	required

Source code in outlines/backends/llguidance.py

def __init__(self, model: SteerableModel):
    """
    Parameters
    ----------
    model
        The Outlines model of the user.

    """
    import llguidance as llg

    self.llg = llg
    self.tensor_library_name = model.tensor_library_name
    self.llg_tokenizer = self._create_llg_tokenizer(model)

`get_cfg_logits_processor(grammar)`

Create a logits processor from a context-free grammar.

Parameters:

Name	Type	Description	Default
`grammar`	`str`	The context-free grammar to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessor`	The logits processor to use to constrain the generation.

Source code in outlines/backends/llguidance.py

def get_cfg_logits_processor(
    self, grammar: str
) -> LLGuidanceLogitsProcessor:
    """Create a logits processor from a context-free grammar.

    Parameters
    ----------
    grammar: str
        The context-free grammar to create a logits processor from.

    Returns
    -------
    LogitsProcessor
        The logits processor to use to constrain the generation.

    """
    # We try both lark and ebnf
    try:
        grammar_spec = self.llg.grammar_from("grammar", grammar)
    except ValueError:
        grammar_spec = self.llg.grammar_from("lark", grammar)
    return LLGuidanceLogitsProcessor(
        grammar_spec, self.llg_tokenizer, self.tensor_library_name
    )

`get_json_schema_logits_processor(json_schema)`

Create a logits processor from a JSON schema.

Parameters:

Name	Type	Description	Default
`json_schema`	`str`	The JSON schema to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessor`	The logits processor to use to constrain the generation.

Source code in outlines/backends/llguidance.py

def get_json_schema_logits_processor(
    self, json_schema: str
) -> LLGuidanceLogitsProcessor:
    """Create a logits processor from a JSON schema.

    Parameters
    ----------
    json_schema: str
        The JSON schema to create a logits processor from.

    Returns
    -------
    LogitsProcessor
        The logits processor to use to constrain the generation.

    """
    grammar_spec = self.llg.grammar_from("json_schema", json_schema)
    return LLGuidanceLogitsProcessor(
        grammar_spec, self.llg_tokenizer, self.tensor_library_name
    )

`get_regex_logits_processor(regex)`

Create a logits processor from a regex.

Parameters:

Name	Type	Description	Default
`regex`	`str`	The regex to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessor`	The logits processor to use to constrain the generation.

Source code in outlines/backends/llguidance.py

def get_regex_logits_processor(
    self, regex: str
) -> LLGuidanceLogitsProcessor:
    """Create a logits processor from a regex.

    Parameters
    ----------
    regex: str
        The regex to create a logits processor from.

    Returns
    -------
    LogitsProcessor
        The logits processor to use to constrain the generation.

    """
    grammar_spec = self.llg.grammar_from("regex", regex)
    return LLGuidanceLogitsProcessor(
        grammar_spec, self.llg_tokenizer, self.tensor_library_name
    )

`LLGuidanceLogitsProcessor`

Bases: OutlinesLogitsProcessor

Logits Processor for the LLGuidance backend.

Source code in outlines/backends/llguidance.py

class LLGuidanceLogitsProcessor(OutlinesLogitsProcessor):
    """Logits Processor for the LLGuidance backend."""

    def __init__(
        self,
        grammar: str,
        llg_tokenizer,
        tensor_library_name: str,
    ) -> None:
        """
        Parameters
        ----------
        grammar: str
            The grammar spec to use to create the LLMatcher
        llg_tokenizer: LLTokenizer
            The LLGuidance tokenizer
        tensor_library_name: str
            The name of the tensor library used by the model

        """
        self.is_first_token = True
        self.grammar = grammar
        self.llg_tokenizer = llg_tokenizer
        self.tensor_library_name = tensor_library_name
        super().__init__(tensor_library_name)

    def reset(self):
        """Ensure self._setup is called again for the next generation."""
        self.is_first_token = True

    def _setup(self, batch_size: int) -> None:
        """Setup the LLMatchers, the bitmask and some functions used in the
        `process_logits` method.

        This method is called when the first token is generated instead of
        at initialization because we need to know the batch size.

        Parameters
        ----------
        batch_size: int
            The batch size of the input

        """
        from llguidance import LLMatcher

        self.ll_matchers = [
            LLMatcher(self.llg_tokenizer, self.grammar)
            for _ in range(batch_size)
        ]

        # we must adapt the bitmask creation and the bias function to the
        # tensor library used by the model
        if self.tensor_library_name == "torch":
            import llguidance.torch

            self.bitmask = llguidance.torch.allocate_token_bitmask(batch_size, self.llg_tokenizer.vocab_size)
            self._bias_logits = self._bias_logits_torch
        elif self.tensor_library_name == "numpy":
            import llguidance.numpy

            self.bitmask = llguidance.numpy.allocate_token_bitmask(batch_size, self.llg_tokenizer.vocab_size)
            self._bias_logits = self._bias_logits_numpy
        elif self.tensor_library_name == "mlx": # pragma: no cover
            import llguidance.numpy

            self.bitmask = llguidance.numpy.allocate_token_bitmask(batch_size, self.llg_tokenizer.vocab_size)
            self._bias_logits = self._bias_logits_mlx
        else: # pragma: no cover
            raise ValueError(f"Unsupported tensor library: {self.tensor_library_name}")

    def _bias_logits_mlx( # pragma: no cover
        self, input_ids: TensorType, logits: TensorType
    ) -> TensorType:
        """Bias the logits for the MLX backend."""
        import llguidance.mlx
        import llguidance.numpy

        biased_logits_array = []
        for i in range(self.tensor_adapter.shape(input_ids)[0]):
            llguidance.numpy.fill_next_token_bitmask(self.ll_matchers[i], self.bitmask, i)
            biased_logits = llguidance.mlx.apply_token_bitmask(
                logits[i], self.bitmask[i] # type: ignore
            )
            biased_logits_array.append(biased_logits)

        return self.tensor_adapter.concatenate(biased_logits_array)

    def _bias_logits_torch(
        self, input_ids: TensorType, logits: TensorType
    ) -> TensorType:
        """Bias the logits for the Torch backend."""
        import llguidance.torch

        for i in range(self.tensor_adapter.shape(input_ids)[0]):
            llguidance.torch.fill_next_token_bitmask(self.ll_matchers[i], self.bitmask, i)
            self.bitmask = self.tensor_adapter.to_device(
                self.bitmask,
                self.tensor_adapter.get_device(logits)
            )
            llguidance.torch.apply_token_bitmask_inplace(
                logits[i], # type: ignore
                self.bitmask[i]
            )
            self.bitmask = self.tensor_adapter.to_device(
                self.bitmask,
                "cpu"
            )

        return logits

    def _bias_logits_numpy(
        self, input_ids: TensorType, logits: TensorType
    ) -> TensorType:
        """Bias the logits for the Numpy backend."""
        import llguidance.numpy

        for i in range(self.tensor_adapter.shape(input_ids)[0]):
            llguidance.numpy.fill_next_token_bitmask(self.ll_matchers[i], self.bitmask, i)
            llguidance.numpy.apply_token_bitmask_inplace(
                logits[i], self.bitmask[i] # type: ignore
            )

        return logits

    def process_logits(
        self, input_ids: TensorType, logits: TensorType
    ) -> TensorType:
        """Use the instances of LLMatcher to bias the logits.

        Parameters
        ----------
        input_ids
            The ids of the tokens of the existing sequences.
        logits
            The logits for the current generation step.

        Returns
        -------
        TensorType
            The biased logits.

        """
        if self.is_first_token:
            self._setup(self.tensor_adapter.shape(input_ids)[0])
            self.is_first_token = False

        # we do not make the matchers consume the last token during the first
        # generation step because no tokens have been generated yet
        else:
            for i in range(self.tensor_adapter.shape(input_ids)[0]):
                sequence = input_ids[i] # type: ignore
                last_token = sequence[-1].item()
                self.ll_matchers[i].consume_token(last_token)
                error = self.ll_matchers[i].get_error()
                if error:
                    warnings.warn(f"Error in LLMatcher: {error}")

        return self._bias_logits(input_ids, logits)

`init(grammar, llg_tokenizer, tensor_library_name)`

Parameters:

Name	Type	Description	Default
`grammar`	`str`	The grammar spec to use to create the LLMatcher	required
`llg_tokenizer`		The LLGuidance tokenizer	required
`tensor_library_name`	`str`	The name of the tensor library used by the model	required

Source code in outlines/backends/llguidance.py

def __init__(
    self,
    grammar: str,
    llg_tokenizer,
    tensor_library_name: str,
) -> None:
    """
    Parameters
    ----------
    grammar: str
        The grammar spec to use to create the LLMatcher
    llg_tokenizer: LLTokenizer
        The LLGuidance tokenizer
    tensor_library_name: str
        The name of the tensor library used by the model

    """
    self.is_first_token = True
    self.grammar = grammar
    self.llg_tokenizer = llg_tokenizer
    self.tensor_library_name = tensor_library_name
    super().__init__(tensor_library_name)

`process_logits(input_ids, logits)`

Use the instances of LLMatcher to bias the logits.

Parameters:

Name	Type	Description	Default
`input_ids`	`TensorType`	The ids of the tokens of the existing sequences.	required
`logits`	`TensorType`	The logits for the current generation step.	required

Returns:

Type	Description
`TensorType`	The biased logits.

Source code in outlines/backends/llguidance.py

def process_logits(
    self, input_ids: TensorType, logits: TensorType
) -> TensorType:
    """Use the instances of LLMatcher to bias the logits.

    Parameters
    ----------
    input_ids
        The ids of the tokens of the existing sequences.
    logits
        The logits for the current generation step.

    Returns
    -------
    TensorType
        The biased logits.

    """
    if self.is_first_token:
        self._setup(self.tensor_adapter.shape(input_ids)[0])
        self.is_first_token = False

    # we do not make the matchers consume the last token during the first
    # generation step because no tokens have been generated yet
    else:
        for i in range(self.tensor_adapter.shape(input_ids)[0]):
            sequence = input_ids[i] # type: ignore
            last_token = sequence[-1].item()
            self.ll_matchers[i].consume_token(last_token)
            error = self.ll_matchers[i].get_error()
            if error:
                warnings.warn(f"Error in LLMatcher: {error}")

    return self._bias_logits(input_ids, logits)

`reset()`

Ensure self._setup is called again for the next generation.

Source code in outlines/backends/llguidance.py

46
47
48

def reset(self):
    """Ensure self._setup is called again for the next generation."""
    self.is_first_token = True

`outlines_core`

Backend class for Outlines Core.

`OutlinesCoreBackend`

Bases: BaseBackend

Backend for Outlines Core.

Source code in outlines/backends/outlines_core.py

class OutlinesCoreBackend(BaseBackend):
    """Backend for Outlines Core."""

    def __init__(self, model: SteerableModel):
        """
        Parameters
        ----------
        model
            The Outlines model of the user.

        """
        if isinstance(model, Transformers):
            tokenizer = model.tokenizer
            vocabulary = tokenizer.get_vocab()
            eos_token_id = tokenizer.eos_token_id
            eos_token = tokenizer.eos_token
            token_to_str = tokenizer.convert_token_to_string
        elif isinstance(model, LlamaCpp):
            tokenizer = model.tokenizer # type: ignore
            vocabulary = tokenizer.vocabulary
            eos_token_id = tokenizer.eos_token_id
            eos_token = tokenizer.eos_token
            token_to_str = tokenizer.convert_token_to_string
        elif isinstance(model, MLXLM): # pragma: no cover
            tokenizer = model.mlx_tokenizer # type: ignore
            vocabulary = tokenizer.get_vocab()
            eos_token_id = tokenizer.eos_token_id
            eos_token = tokenizer.eos_token
            token_to_str = lambda token: tokenizer.convert_tokens_to_string([token]) # type: ignore
        else: # pragma: no cover
            raise ValueError(f"Unsupported model type: {type(model)}")

        self.eos_token_id = eos_token_id
        self.vocabulary = self.create_outlines_core_vocabulary(
            vocabulary, eos_token_id, eos_token, token_to_str
        )
        self.tensor_library_name = model.tensor_library_name

    def get_json_schema_logits_processor(
        self, json_schema: str
    ):
        """Create a logits processor from a JSON schema.

        Parameters
        ----------
        json_schema: str
            The JSON schema to create a logits processor from.

        Returns
        -------
        LogitsProcessor
            The logits processor to use to constrain the generation.

        """
        regex = outlines_core.json_schema.build_regex_from_schema(json_schema)
        return self.get_regex_logits_processor(regex)

    def get_regex_logits_processor(self, regex: str):
        """Create a logits processor from a regex.

        Parameters
        ----------
        regex: str
            The regex to create a logits processor from.

        Returns
        -------
        LogitsProcessor
            The logits processor to use to constrain the generation.

        """
        index = Index(regex, self.vocabulary)
        return OutlinesCoreLogitsProcessor(index, self.tensor_library_name)

    def get_cfg_logits_processor(self, grammar):
        raise NotImplementedError(
            "Outlines Core does not support context-free grammar."
        )

    @staticmethod
    def create_outlines_core_vocabulary(
        vocab: Dict[str, int],
        eos_token_id: int,
        eos_token: str,
        token_to_str: Callable[[str], str]
    ) -> Vocabulary:
        """Create an Outlines Core Vocabulary instance.

        Parameters
        ----------
        vocab: Dict[str, int]
            The vocabulary to create an Outlines Core vocabulary from.
        eos_token_id: int
            The EOS token ID.
        eos_token: str
            The EOS token.
        token_to_str: Callable[[str], str]
            The function to convert a token to a string.

        Returns
        -------
        Vocabulary
            The Outlines Core Vocabulary instance.

        """
        formatted_vocab = {}
        for token, token_id in vocab.items():
            # This step is necessary to transform special tokens into their
            # string representation, in particular for spacing. We need those
            # string representations as outlines core first builds an FSM from
            # the regex provided that only contains regular strings.
            token_as_str = token_to_str(token)
            formatted_vocab[token_as_str] = [token_id]
        formatted_vocab.pop(eos_token)
        return Vocabulary(eos_token_id, formatted_vocab)

`init(model)`

Parameters:

Name	Type	Description	Default
`model`	`SteerableModel`	The Outlines model of the user.	required

Source code in outlines/backends/outlines_core.py

def __init__(self, model: SteerableModel):
    """
    Parameters
    ----------
    model
        The Outlines model of the user.

    """
    if isinstance(model, Transformers):
        tokenizer = model.tokenizer
        vocabulary = tokenizer.get_vocab()
        eos_token_id = tokenizer.eos_token_id
        eos_token = tokenizer.eos_token
        token_to_str = tokenizer.convert_token_to_string
    elif isinstance(model, LlamaCpp):
        tokenizer = model.tokenizer # type: ignore
        vocabulary = tokenizer.vocabulary
        eos_token_id = tokenizer.eos_token_id
        eos_token = tokenizer.eos_token
        token_to_str = tokenizer.convert_token_to_string
    elif isinstance(model, MLXLM): # pragma: no cover
        tokenizer = model.mlx_tokenizer # type: ignore
        vocabulary = tokenizer.get_vocab()
        eos_token_id = tokenizer.eos_token_id
        eos_token = tokenizer.eos_token
        token_to_str = lambda token: tokenizer.convert_tokens_to_string([token]) # type: ignore
    else: # pragma: no cover
        raise ValueError(f"Unsupported model type: {type(model)}")

    self.eos_token_id = eos_token_id
    self.vocabulary = self.create_outlines_core_vocabulary(
        vocabulary, eos_token_id, eos_token, token_to_str
    )
    self.tensor_library_name = model.tensor_library_name

`create_outlines_core_vocabulary(vocab, eos_token_id, eos_token, token_to_str)` `staticmethod`

Create an Outlines Core Vocabulary instance.

Parameters:

Name	Type	Description	Default
`vocab`	`Dict[str, int]`	The vocabulary to create an Outlines Core vocabulary from.	required
`eos_token_id`	`int`	The EOS token ID.	required
`eos_token`	`str`	The EOS token.	required
`token_to_str`	`Callable[[str], str]`	The function to convert a token to a string.	required

Returns:

Type	Description
`Vocabulary`	The Outlines Core Vocabulary instance.

Source code in outlines/backends/outlines_core.py

@staticmethod
def create_outlines_core_vocabulary(
    vocab: Dict[str, int],
    eos_token_id: int,
    eos_token: str,
    token_to_str: Callable[[str], str]
) -> Vocabulary:
    """Create an Outlines Core Vocabulary instance.

    Parameters
    ----------
    vocab: Dict[str, int]
        The vocabulary to create an Outlines Core vocabulary from.
    eos_token_id: int
        The EOS token ID.
    eos_token: str
        The EOS token.
    token_to_str: Callable[[str], str]
        The function to convert a token to a string.

    Returns
    -------
    Vocabulary
        The Outlines Core Vocabulary instance.

    """
    formatted_vocab = {}
    for token, token_id in vocab.items():
        # This step is necessary to transform special tokens into their
        # string representation, in particular for spacing. We need those
        # string representations as outlines core first builds an FSM from
        # the regex provided that only contains regular strings.
        token_as_str = token_to_str(token)
        formatted_vocab[token_as_str] = [token_id]
    formatted_vocab.pop(eos_token)
    return Vocabulary(eos_token_id, formatted_vocab)

`get_json_schema_logits_processor(json_schema)`

Create a logits processor from a JSON schema.

Parameters:

Name	Type	Description	Default
`json_schema`	`str`	The JSON schema to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessor`	The logits processor to use to constrain the generation.

Source code in outlines/backends/outlines_core.py

def get_json_schema_logits_processor(
    self, json_schema: str
):
    """Create a logits processor from a JSON schema.

    Parameters
    ----------
    json_schema: str
        The JSON schema to create a logits processor from.

    Returns
    -------
    LogitsProcessor
        The logits processor to use to constrain the generation.

    """
    regex = outlines_core.json_schema.build_regex_from_schema(json_schema)
    return self.get_regex_logits_processor(regex)

`get_regex_logits_processor(regex)`

Create a logits processor from a regex.

Parameters:

Name	Type	Description	Default
`regex`	`str`	The regex to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessor`	The logits processor to use to constrain the generation.

Source code in outlines/backends/outlines_core.py

def get_regex_logits_processor(self, regex: str):
    """Create a logits processor from a regex.

    Parameters
    ----------
    regex: str
        The regex to create a logits processor from.

    Returns
    -------
    LogitsProcessor
        The logits processor to use to constrain the generation.

    """
    index = Index(regex, self.vocabulary)
    return OutlinesCoreLogitsProcessor(index, self.tensor_library_name)

`OutlinesCoreLogitsProcessor`

Bases: OutlinesLogitsProcessor

Logits processor for Outlines Core.

Source code in outlines/backends/outlines_core.py

class OutlinesCoreLogitsProcessor(OutlinesLogitsProcessor):
    """Logits processor for Outlines Core."""

    def __init__(
        self, index: Index, tensor_library_name: str
    ):
        """
        Parameters
        ----------
        index: Index
            The Outlines Core `Index` instance to use to create the Outlines
            Core `Guide` instances that will be used to bias the logits
        tensor_library_name: str
            The tensor library name to use for the logits processor.

        """
        self.index = index
        self.tensor_library_name = tensor_library_name
        self.is_first_token = True
        super().__init__(tensor_library_name)

    def reset(self) -> None:
        """Reset the logits processor."""
        self.is_first_token = True

    def _setup(self, batch_size: int, vocab_size: int) -> None:
        """Set the guides, bitmasks and some functions used in the
        `process_logits` method.

        This method is called when the first token is generated instead of
        at initialization because we need to know the batch size and the device
        of the logits.

        Parameters
        ----------
        batch_size: int
            The batch size.
        vocab_size: int
            The vocabulary size.

        """
        if self.tensor_library_name == "torch":
            from outlines_core.kernels.torch import allocate_token_bitmask

            self.allocate_token_bitmask = allocate_token_bitmask
            self.bias_logits = self._bias_logits_torch

        elif self.tensor_library_name == "numpy":
            from outlines_core.kernels.numpy import allocate_token_bitmask

            self.allocate_token_bitmask = allocate_token_bitmask
            self.bias_logits = self._bias_logits_numpy

        elif self.tensor_library_name == "mlx": # pragma: no cover
            from outlines_core.kernels.mlx import (
                allocate_token_bitmask
            )

            self.allocate_token_bitmask = allocate_token_bitmask
            self.bias_logits = self._bias_logits_mlx

        else: # pragma: no cover
            raise ValueError(
                f"Unsupported tensor library: {self.tensor_library_name}"
            )

        self._guides = [Guide(self.index) for _ in range(batch_size)]
        self._bitmasks = [
            self.allocate_token_bitmask(vocab_size)
            for _ in range(batch_size)
        ]

    def _bias_logits_mlx( # pragma: no cover
        self, batch_size: int, logits: TensorType
    ) -> TensorType:
        """Bias the logits for MLX tensors."""
        from outlines_core.kernels.mlx import (
            apply_token_bitmask,
            fill_next_token_bitmask
        )

        biased_logits_array = []
        for i in range(batch_size):
            fill_next_token_bitmask(self._guides[i], self._bitmasks[i])
            biased_logits = apply_token_bitmask(
                self.tensor_adapter.unsqueeze(logits[i]), self._bitmasks[i] # type: ignore
            )
            biased_logits_array.append(biased_logits)

        return self.tensor_adapter.concatenate(biased_logits_array)

    def _bias_logits_torch(
        self, batch_size: int, logits: TensorType
    ) -> TensorType:
        """Bias the logits for Torch tensors."""
        from outlines_core.kernels.torch import (
            apply_token_bitmask_inplace,
            fill_next_token_bitmask
        )

        for i in range(batch_size):
            fill_next_token_bitmask(self._guides[i], self._bitmasks[i])
            self._bitmasks[i] = self.tensor_adapter.to_device(
                self._bitmasks[i],
                self.tensor_adapter.get_device(logits)
            )
            apply_token_bitmask_inplace(
                self.tensor_adapter.unsqueeze(logits[i]), # type: ignore
                self._bitmasks[i]
            )
            self._bitmasks[i] = self.tensor_adapter.to_device(
                self._bitmasks[i],
                "cpu"
            )

        return logits

    def _bias_logits_numpy(
        self, batch_size: int, logits: TensorType
    ) -> TensorType:
        """Bias the logits for Numpy tensors."""
        from outlines_core.kernels.numpy import (
            apply_token_bitmask_inplace,
            fill_next_token_bitmask
        )

        for i in range(batch_size):
            fill_next_token_bitmask(self._guides[i], self._bitmasks[i])
            apply_token_bitmask_inplace(
                self.tensor_adapter.unsqueeze(logits[i]), # type: ignore
                self._bitmasks[i]
            )

        return logits

    def process_logits(
        self, input_ids: TensorType, logits: TensorType
    ) -> TensorType:
        """Use the guides to bias the logits.

        Parameters
        ----------
        input_ids
            The ids of the tokens of the existing sequences.
        logits
            The logits for the current generation step.

        Returns
        -------
        TensorType
            The biased logits.

        """
        batch_size = self.tensor_adapter.shape(input_ids)[0]
        vocab_size = self.tensor_adapter.shape(logits)[1]

        if self.is_first_token:
            self._setup(batch_size, vocab_size)
            self.is_first_token = False
        else:
            for i in range(batch_size):
                last_token_id = self.tensor_adapter.to_scalar(input_ids[i][-1]) # type: ignore
                # This circumvents issue #227 in outlines_core
                # Ideally, we would be able to advance all the times as the final
                # state would accept the eos token leading to itself
                if (
                    not self._guides[i].is_finished()
                    or self._guides[i].accepts_tokens([last_token_id])
                ):
                    self._guides[i].advance(
                        token_id=last_token_id,
                        return_tokens=False
                    )

        return self.bias_logits(batch_size, logits)

`init(index, tensor_library_name)`

Parameters:

Name	Type	Description	Default
`index`	`Index`	The Outlines Core `Index` instance to use to create the Outlines Core `Guide` instances that will be used to bias the logits	required
`tensor_library_name`	`str`	The tensor library name to use for the logits processor.	required

Source code in outlines/backends/outlines_core.py

def __init__(
    self, index: Index, tensor_library_name: str
):
    """
    Parameters
    ----------
    index: Index
        The Outlines Core `Index` instance to use to create the Outlines
        Core `Guide` instances that will be used to bias the logits
    tensor_library_name: str
        The tensor library name to use for the logits processor.

    """
    self.index = index
    self.tensor_library_name = tensor_library_name
    self.is_first_token = True
    super().__init__(tensor_library_name)

`process_logits(input_ids, logits)`

Use the guides to bias the logits.

Parameters:

Name	Type	Description	Default
`input_ids`	`TensorType`	The ids of the tokens of the existing sequences.	required
`logits`	`TensorType`	The logits for the current generation step.	required

Returns:

Type	Description
`TensorType`	The biased logits.

Source code in outlines/backends/outlines_core.py

def process_logits(
    self, input_ids: TensorType, logits: TensorType
) -> TensorType:
    """Use the guides to bias the logits.

    Parameters
    ----------
    input_ids
        The ids of the tokens of the existing sequences.
    logits
        The logits for the current generation step.

    Returns
    -------
    TensorType
        The biased logits.

    """
    batch_size = self.tensor_adapter.shape(input_ids)[0]
    vocab_size = self.tensor_adapter.shape(logits)[1]

    if self.is_first_token:
        self._setup(batch_size, vocab_size)
        self.is_first_token = False
    else:
        for i in range(batch_size):
            last_token_id = self.tensor_adapter.to_scalar(input_ids[i][-1]) # type: ignore
            # This circumvents issue #227 in outlines_core
            # Ideally, we would be able to advance all the times as the final
            # state would accept the eos token leading to itself
            if (
                not self._guides[i].is_finished()
                or self._guides[i].accepts_tokens([last_token_id])
            ):
                self._guides[i].advance(
                    token_id=last_token_id,
                    return_tokens=False
                )

    return self.bias_logits(batch_size, logits)

`reset()`

Reset the logits processor.

Source code in outlines/backends/outlines_core.py

41
42
43

def reset(self) -> None:
    """Reset the logits processor."""
    self.is_first_token = True

`xgrammar`

Backend class for XGrammar.

`XGrammarBackend`

Bases: BaseBackend

Backend for XGrammar.

Source code in outlines/backends/xgrammar.py

class XGrammarBackend(BaseBackend):
    """Backend for XGrammar."""

    def __init__(self, model: SteerableModel):
        """
        Parameters
        ----------
        model
            The Outlines model of the user.

        """
        import xgrammar as xgr

        if isinstance(model, Transformers):
            tokenizer = model.hf_tokenizer
        elif isinstance(model, MLXLM): # pragma: no cover
            tokenizer = model.mlx_tokenizer._tokenizer
        else: # pragma: no cover
            raise ValueError(
                "The xgrammar backend only supports Transformers and "
                + "MLXLM models"
            )

        tokenizer_info = xgr.TokenizerInfo.from_huggingface(
            tokenizer,
            vocab_size=len(tokenizer.get_vocab())
        )
        self.grammar_compiler = xgr.GrammarCompiler(tokenizer_info)
        self.tensor_library_name = model.tensor_library_name

    def get_json_schema_logits_processor(
        self, json_schema: str
    ) -> XGrammarLogitsProcessor:
        """Create a logits processor from a JSON schema.

        Parameters
        ----------
        json_schema: str
            The JSON schema to create a logits processor from.

        Returns
        -------
        LogitsProcessor
            The logits processor to use to constrain the generation.

        """
        compiled_grammar = self.grammar_compiler.compile_json_schema(
            json_schema
        )
        return XGrammarLogitsProcessor(
            compiled_grammar,
            self.tensor_library_name
        )

    def get_regex_logits_processor(
        self, regex: str
    ) -> XGrammarLogitsProcessor:
        """Create a logits processor from a regex.

        Parameters
        ----------
        regex: str
            The regex to create a logits processor from.

        Returns
        -------
        LogitsProcessor
            The logits processor to use to constrain the generation.

        """
        compiled_grammar = self.grammar_compiler.compile_regex(regex)
        return XGrammarLogitsProcessor(
            compiled_grammar,
            self.tensor_library_name
        )

    def get_cfg_logits_processor(
        self, grammar: str
    ) -> XGrammarLogitsProcessor:
        """Create a logits processor from a context-free grammar.

        Parameters
        ----------
        grammar: str
            The context-free grammar to create a logits processor from.

        Returns
        -------
        LogitsProcessor
            The logits processor to use to constrain the generation.

        """
        compiled_grammar = self.grammar_compiler.compile_grammar(grammar)
        return XGrammarLogitsProcessor(
            compiled_grammar,
            self.tensor_library_name
        )

`init(model)`

Parameters:

Name	Type	Description	Default
`model`	`SteerableModel`	The Outlines model of the user.	required

Source code in outlines/backends/xgrammar.py

def __init__(self, model: SteerableModel):
    """
    Parameters
    ----------
    model
        The Outlines model of the user.

    """
    import xgrammar as xgr

    if isinstance(model, Transformers):
        tokenizer = model.hf_tokenizer
    elif isinstance(model, MLXLM): # pragma: no cover
        tokenizer = model.mlx_tokenizer._tokenizer
    else: # pragma: no cover
        raise ValueError(
            "The xgrammar backend only supports Transformers and "
            + "MLXLM models"
        )

    tokenizer_info = xgr.TokenizerInfo.from_huggingface(
        tokenizer,
        vocab_size=len(tokenizer.get_vocab())
    )
    self.grammar_compiler = xgr.GrammarCompiler(tokenizer_info)
    self.tensor_library_name = model.tensor_library_name

`get_cfg_logits_processor(grammar)`

Create a logits processor from a context-free grammar.

Parameters:

Name	Type	Description	Default
`grammar`	`str`	The context-free grammar to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessor`	The logits processor to use to constrain the generation.

Source code in outlines/backends/xgrammar.py

def get_cfg_logits_processor(
    self, grammar: str
) -> XGrammarLogitsProcessor:
    """Create a logits processor from a context-free grammar.

    Parameters
    ----------
    grammar: str
        The context-free grammar to create a logits processor from.

    Returns
    -------
    LogitsProcessor
        The logits processor to use to constrain the generation.

    """
    compiled_grammar = self.grammar_compiler.compile_grammar(grammar)
    return XGrammarLogitsProcessor(
        compiled_grammar,
        self.tensor_library_name
    )

`get_json_schema_logits_processor(json_schema)`

Create a logits processor from a JSON schema.

Parameters:

Name	Type	Description	Default
`json_schema`	`str`	The JSON schema to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessor`	The logits processor to use to constrain the generation.

Source code in outlines/backends/xgrammar.py

def get_json_schema_logits_processor(
    self, json_schema: str
) -> XGrammarLogitsProcessor:
    """Create a logits processor from a JSON schema.

    Parameters
    ----------
    json_schema: str
        The JSON schema to create a logits processor from.

    Returns
    -------
    LogitsProcessor
        The logits processor to use to constrain the generation.

    """
    compiled_grammar = self.grammar_compiler.compile_json_schema(
        json_schema
    )
    return XGrammarLogitsProcessor(
        compiled_grammar,
        self.tensor_library_name
    )

`get_regex_logits_processor(regex)`

Create a logits processor from a regex.

Parameters:

Name	Type	Description	Default
`regex`	`str`	The regex to create a logits processor from.	required

Returns:

Type	Description
`LogitsProcessor`	The logits processor to use to constrain the generation.

Source code in outlines/backends/xgrammar.py

def get_regex_logits_processor(
    self, regex: str
) -> XGrammarLogitsProcessor:
    """Create a logits processor from a regex.

    Parameters
    ----------
    regex: str
        The regex to create a logits processor from.

    Returns
    -------
    LogitsProcessor
        The logits processor to use to constrain the generation.

    """
    compiled_grammar = self.grammar_compiler.compile_regex(regex)
    return XGrammarLogitsProcessor(
        compiled_grammar,
        self.tensor_library_name
    )

`XGrammarLogitsProcessor`

Bases: OutlinesLogitsProcessor

Logits processor for XGrammar.

Source code in outlines/backends/xgrammar.py

class XGrammarLogitsProcessor(OutlinesLogitsProcessor):
    """Logits processor for XGrammar."""

    def __init__(self, compiled_grammar: str, tensor_library_name: str,):
        """
        Parameters
        ----------
        compiled_grammar: str
            The compiled grammar to use to create the logits processor.
        tensor_library_name: str
            The name of the tensor library used by the model

        """
        import xgrammar as xgr

        self.xgr = xgr
        self.is_first_token = True
        self.compiled_grammar = compiled_grammar
        self.tensor_library_name = tensor_library_name
        super().__init__(tensor_library_name)

    def reset(self):
        """Ensure self._setup is called again for the next generation."""
        self.is_first_token = True

    def _setup(self, batch_size: int, vocab_size: int) -> None:
        """Setup the logits processor for a new generation."""
        if self.tensor_library_name == "torch":
            self._bias_logits = self._bias_logits_torch
        elif self.tensor_library_name == "mlx": # pragma: no cover
            self._bias_logits = self._bias_logits_mlx
        else: # pragma: no cover
            raise ValueError(
                f"Unsupported tensor library: {self.tensor_library_name}"
            )

        self._matchers = [
            self.xgr.GrammarMatcher(self.compiled_grammar)
            for _ in range(batch_size)
        ]
        self._bitmask = self.xgr.allocate_token_bitmask(batch_size, vocab_size)

    def _bias_logits_torch(
        self, input_ids: TensorType, logits: TensorType
    ) -> TensorType:
        """Bias the logits for Torch tensors."""
        for i in range(self.tensor_adapter.shape(input_ids)[0]):
            if not self._matchers[i].is_terminated():
                self._matchers[i].fill_next_token_bitmask(self._bitmask, i)

        self._bitmask = self.tensor_adapter.to_device(
            self._bitmask,
            self.tensor_adapter.get_device(logits)
        )
        self.xgr.apply_token_bitmask_inplace(logits, self._bitmask)
        self._bitmask = self.tensor_adapter.to_device(
            self._bitmask,
            "cpu"
        )

        return logits

    def _bias_logits_mlx( # pragma: no cover
        self, input_ids: TensorType, logits: TensorType
    ) -> TensorType:
        """Bias the logits for MLX tensors."""
        import mlx.core as mx
        from xgrammar.kernels.apply_token_bitmask_mlx import apply_token_bitmask_mlx

        for i in range(self.tensor_adapter.shape(input_ids)[0]):
            if not self._matchers[i].is_terminated():
                self._matchers[i].fill_next_token_bitmask(self._bitmask, i)

        biased_logits = apply_token_bitmask_mlx(
            mx.array(self._bitmask.numpy()), logits, self.tensor_adapter.shape(logits)[1]
        )

        return biased_logits

    def process_logits(
        self, input_ids: TensorType, logits: TensorType
    ) -> TensorType:
        """Use the XGrammar matchers to bias the logits."""
        batch_size = self.tensor_adapter.shape(input_ids)[0]
        vocab_size = self.tensor_adapter.shape(logits)[1]

        if self.is_first_token:
            self._setup(batch_size, vocab_size)
            self.is_first_token = False
        else:
            for i in range(batch_size):
                if not self._matchers[i].is_terminated(): # pragma: no cover
                    last_token_id = self.tensor_adapter.to_scalar(
                        input_ids[i][-1] # type: ignore
                    )
                    assert self._matchers[i].accept_token(last_token_id)

        return self._bias_logits(input_ids, logits)

`init(compiled_grammar, tensor_library_name)`

Parameters:

Name	Type	Description	Default
`compiled_grammar`	`str`	The compiled grammar to use to create the logits processor.	required
`tensor_library_name`	`str`	The name of the tensor library used by the model	required

Source code in outlines/backends/xgrammar.py

def __init__(self, compiled_grammar: str, tensor_library_name: str,):
    """
    Parameters
    ----------
    compiled_grammar: str
        The compiled grammar to use to create the logits processor.
    tensor_library_name: str
        The name of the tensor library used by the model

    """
    import xgrammar as xgr

    self.xgr = xgr
    self.is_first_token = True
    self.compiled_grammar = compiled_grammar
    self.tensor_library_name = tensor_library_name
    super().__init__(tensor_library_name)

`process_logits(input_ids, logits)`

Use the XGrammar matchers to bias the logits.

Source code in outlines/backends/xgrammar.py

def process_logits(
    self, input_ids: TensorType, logits: TensorType
) -> TensorType:
    """Use the XGrammar matchers to bias the logits."""
    batch_size = self.tensor_adapter.shape(input_ids)[0]
    vocab_size = self.tensor_adapter.shape(logits)[1]

    if self.is_first_token:
        self._setup(batch_size, vocab_size)
        self.is_first_token = False
    else:
        for i in range(batch_size):
            if not self._matchers[i].is_terminated(): # pragma: no cover
                last_token_id = self.tensor_adapter.to_scalar(
                    input_ids[i][-1] # type: ignore
                )
                assert self._matchers[i].accept_token(last_token_id)

    return self._bias_logits(input_ids, logits)

`reset()`

Ensure self._setup is called again for the next generation.

Source code in outlines/backends/xgrammar.py

34
35
36

def reset(self):
    """Ensure self._setup is called again for the next generation."""
    self.is_first_token = True

backends

BaseBackend

get_cfg_logits_processor(grammar) abstractmethod

get_json_schema_logits_processor(json_schema) abstractmethod

get_regex_logits_processor(regex) abstractmethod

LLGuidanceBackend

__init__(model)

get_cfg_logits_processor(grammar)

get_json_schema_logits_processor(json_schema)

get_regex_logits_processor(regex)

OutlinesCoreBackend

__init__(model)

create_outlines_core_vocabulary(vocab, eos_token_id, eos_token, token_to_str) staticmethod

get_json_schema_logits_processor(json_schema)

get_regex_logits_processor(regex)

XGrammarBackend

__init__(model)

get_cfg_logits_processor(grammar)

get_json_schema_logits_processor(json_schema)

get_regex_logits_processor(regex)

get_cfg_logits_processor(backend_name, model, grammar)

get_json_schema_logits_processor(backend_name, model, json_schema)

get_regex_logits_processor(backend_name, model, regex)

base

BaseBackend

get_cfg_logits_processor(grammar) abstractmethod

get_json_schema_logits_processor(json_schema) abstractmethod

get_regex_logits_processor(regex) abstractmethod

llguidance

LLGuidanceBackend

__init__(model)

get_cfg_logits_processor(grammar)

get_json_schema_logits_processor(json_schema)

get_regex_logits_processor(regex)

LLGuidanceLogitsProcessor

__init__(grammar, llg_tokenizer, tensor_library_name)

process_logits(input_ids, logits)

reset()

outlines_core

OutlinesCoreBackend

__init__(model)

create_outlines_core_vocabulary(vocab, eos_token_id, eos_token, token_to_str) staticmethod

get_json_schema_logits_processor(json_schema)

get_regex_logits_processor(regex)

OutlinesCoreLogitsProcessor

__init__(index, tensor_library_name)

process_logits(input_ids, logits)

reset()

xgrammar

XGrammarBackend

__init__(model)

get_cfg_logits_processor(grammar)

get_json_schema_logits_processor(json_schema)

get_regex_logits_processor(regex)

XGrammarLogitsProcessor

__init__(compiled_grammar, tensor_library_name)

process_logits(input_ids, logits)

reset()

`BaseBackend`

`get_cfg_logits_processor(grammar)` `abstractmethod`

`get_json_schema_logits_processor(json_schema)` `abstractmethod`

`get_regex_logits_processor(regex)` `abstractmethod`

`LLGuidanceBackend`

`init(model)`

`get_cfg_logits_processor(grammar)`

`get_json_schema_logits_processor(json_schema)`

`get_regex_logits_processor(regex)`

`OutlinesCoreBackend`

`init(model)`

`create_outlines_core_vocabulary(vocab, eos_token_id, eos_token, token_to_str)` `staticmethod`

`get_json_schema_logits_processor(json_schema)`

`get_regex_logits_processor(regex)`

`XGrammarBackend`

`init(model)`

`get_cfg_logits_processor(grammar)`

`get_json_schema_logits_processor(json_schema)`

`get_regex_logits_processor(regex)`

`get_cfg_logits_processor(backend_name, model, grammar)`

`get_json_schema_logits_processor(backend_name, model, json_schema)`

`get_regex_logits_processor(backend_name, model, regex)`

`base`

`BaseBackend`

`get_cfg_logits_processor(grammar)` `abstractmethod`

`get_json_schema_logits_processor(json_schema)` `abstractmethod`

`get_regex_logits_processor(regex)` `abstractmethod`

`llguidance`

`LLGuidanceBackend`

`init(model)`

`get_cfg_logits_processor(grammar)`

`get_json_schema_logits_processor(json_schema)`

`get_regex_logits_processor(regex)`

`LLGuidanceLogitsProcessor`

`init(grammar, llg_tokenizer, tensor_library_name)`

`process_logits(input_ids, logits)`

`reset()`

`outlines_core`

`OutlinesCoreBackend`

`init(model)`

`create_outlines_core_vocabulary(vocab, eos_token_id, eos_token, token_to_str)` `staticmethod`

`get_json_schema_logits_processor(json_schema)`

`get_regex_logits_processor(regex)`

`OutlinesCoreLogitsProcessor`

`init(index, tensor_library_name)`

`process_logits(input_ids, logits)`

`reset()`

`xgrammar`

`XGrammarBackend`

`init(model)`

`get_cfg_logits_processor(grammar)`

`get_json_schema_logits_processor(json_schema)`

`get_regex_logits_processor(regex)`

`XGrammarLogitsProcessor`

`init(compiled_grammar, tensor_library_name)`

`process_logits(input_ids, logits)`

`reset()`