Source code for lm_polygraph.estimators.verbalized_1s

import numpy as np
import re

from typing import Dict

from .estimator import Estimator


[docs]class Verbalized1S(Estimator):
    """
    Estimates sequence-level uncertainty of a language model by extracting
    the confidence estimate from the model's answer using a provided regex.
    To use this estimator, model has to be correctly prompted to output
    it's confidence in the answer.
    Adapted from the original implementation in the paper https://arxiv.org/abs/2305.14975
    """

    def __init__(self, confidence_regex="", name_postfix=""):
        self.confidence_regex = confidence_regex
        self.postfix = name_postfix
        super().__init__(["greedy_texts"], "sequence")

    def __str__(self):
        return f"Verbalized1S{self.postfix}"

    def __call__(self, stats: Dict[str, np.ndarray]) -> np.ndarray:
        ues = []
        conf_re = re.compile(self.confidence_regex)
        for answer in stats["greedy_texts"]:
            match = re.search(conf_re, answer)

            try:
                ue = 1 - float(match.groups()[0])
            except AttributeError:
                ue = np.nan

            ues.append(ue)

        return np.array(ues)