Source code for eval.functional

from typing import List, Tuple
import numpy as np



[docs]
def confidence_interval(
    judgements: List[float], confidence: float = 0.95
) -> Tuple[float, float]:
    """
    Calculate the confidence interval for a list of binary judgments.

    Args:
        judgements (List[float]): List of binary judgments (1/0).
        confidence (float): Confidence level (default 0.95).

    Returns:
        tuple: Lower and upper bounds of the confidence interval.
    """
    if not isinstance(judgements, list):
        raise ValueError("judgements must be a list")

    if not all(isinstance(j, (int, float)) for j in judgements):
        raise ValueError("judgements must contain only integers or floats")

    if not isinstance(confidence, (int, float)):
        raise ValueError("confidence must be a number")

    if not 0 < confidence < 1:
        raise ValueError("confidence must be between 0 and 1")

    # Step 1: Calculate the mean
    mean_score = np.mean(judgements)

    # Step 2: Calculate the standard error (SE)
    standard_error = np.std(judgements, ddof=1) / np.sqrt(len(judgements))

    # Step 3: Use the Z-critical value for the confidence interval based on confidence level
    z_critical = np.percentile(
        np.random.normal(0, 1, 1000000), 100 * (1 - (1 - confidence) / 2)
    )

    # Step 4: Calculate the margin of error (MoE)
    margin_of_error = z_critical * standard_error

    # Step 5: Calculate the confidence interval
    # Confidence interval (clipped to [0, 1])
    lower_bound = max(0, mean_score - margin_of_error)
    upper_bound = min(1, mean_score + margin_of_error)

    return (lower_bound, upper_bound)




[docs]
def longest_common_substring(s1: str, s2: str) -> str:
    """
    Find the longest common substring between two strings.
    """
    # Create a matrix to store lengths of longest common suffixes of substrings
    # Initialize all values to 0
    m, n = len(s1), len(s2)
    lcs_matrix = [[0] * (n + 1) for _ in range(m + 1)]

    # Variable to store the length of the longest common substring
    longest_length = 0
    # Variable to store the ending index of the longest common substring in s1
    ending_index_s1 = 0

    # Build the matrix in a bottom-up manner
    for i in range(1, m + 1):
        for j in range(1, n + 1):
            if s1[i - 1] == s2[j - 1]:
                lcs_matrix[i][j] = lcs_matrix[i - 1][j - 1] + 1
                if lcs_matrix[i][j] > longest_length:
                    longest_length = lcs_matrix[i][j]
                    ending_index_s1 = i - 1
            else:
                lcs_matrix[i][j] = 0

    # The longest common substring
    longest_common_substring = s1[
        ending_index_s1 - longest_length + 1 : ending_index_s1 + 1
    ]

    return longest_common_substring



if __name__ == "__main__":
    # Example binary judgments (True/False as 1/0)
    judgements = [1, 1, 0, 1, 0, 1, 1]  # Convert to 1/0
    score_range = confidence_interval(judgements, confidence=0.96)
    print(score_range)

    # Example longest common substring
    s1 = "abcdfghijk"
    s2 = "abedfghxyz"
    cs = longest_common_substring(s1, s2)
    print(cs)