# Initial parameter values: lag D, sequence index n, modulus m.
# They are reassigned further down before the first example uses them.
D, n, m = 4, 50, 1234

from typing import Callable
import time

def naive_lfib(D: int, m: int) -> Callable[[int, bool], list[int] | int]:
    """
    Creates a Lagged Fibonacci Generator (LFG) function.

    Args:
        D (int): The lag period of the generator. Must be >= 2.
        m (int): The modulus to apply for generating the sequence. Must be > 0.

    Returns:
        Callable[[int, bool], list[int] | int]: A generator function that produces
        the sequence up to the nth element or the last element only.

        The generator function has the following parameters:
            n (int): The number of terms to generate in the sequence. Must be >= D.
            full_sequence (bool): Whether to return the full sequence or just the nth term.
                Defaults to True (return full sequence).

    Examples:
        >>> gen = naive_lfib(5, 100)
        >>> S = gen(10)
        >>> print(S)  # Full sequence
        >>> print(gen(10, full_sequence=False))  # Last term only
    """
    def generator(n: int, full_sequence: bool = True) -> list[int] | int:
        if D < 2:
            raise ValueError("D must be at least 2.")
        if m <= 0:
            raise ValueError("m must be greater than 0.")
        if n < D:
            raise ValueError("n must be greater than or equal to D.")

        # Initialize the sequence with D initial terms set to 1
        S: list[int] = [1] * D

        # Generate terms up to the nth term using the LFG formula
        for _ in range(n - D + 1):
            S.append((S[-D] + S[-D + 1]) % m)

        # Return the full sequence or just the last term based on the flag
        return S if full_sequence else S[-1]

    return generator

# Example usage: compute S_0 .. S_30 (mod 100) with lag 5 and time the run.
D, m, n = 5, 100, 30

start = time.time()
gen = naive_lfib(D, m)
S = gen(n)

print("Time needed (in seconds):", time.time() - start)

# S holds the full sequence, so its last entry is S_n.
print(f"Solution for S_{n} (mod {m}) is {S[-1]}")
print("The whole sequence is:", S, sep="\n")

Time needed (in seconds): 0.0001308917999267578
Solution for S_30 (mod 100) is 71
The whole sequence is:
[1, 1, 1, 1, 1, 2, 2, 2, 2, 3, 4, 4, 4, 5, 7, 8, 8, 9, 12, 15, 16, 17, 21, 27, 31, 33, 38, 48, 58, 64, 71]

import numpy
import cupy
import sympy
from typing import Callable, Tuple

def fast_lfib(D: int, m: int, xp=numpy) -> "Tuple[Callable[[int], int], numpy.ndarray | cupy.ndarray]":
    r"""
    Creates a fast Lagged Fibonacci Generator (LFG) using matrix exponentiation.

    The sequence is $S_0 = \dots = S_{D-1} = 1$ and
    $S_k = S_{k-D} + S_{k-D+1} \pmod m$. With the state vector
    $(S_k, \dots, S_{k+D-1})^T$, one step of the recurrence is a
    multiplication by the $D \times D$ matrix $\mathbf{Q}$, so $S_n$ is the
    sum of the last row of $\mathbf{Q}^{n-D+1}$ (the initial state is all ones).

    All arithmetic is done in int64. Because a plain ``(A @ B) % m`` silently
    wraps around once ``D * (m - 1)**2`` exceeds the int64 range, the matrix
    products are evaluated in several narrower pieces whose intermediate
    values are guaranteed to fit.

    Args:
        D (int): The lag period of the generator. Must be >= 2.
        m (int): The modulus to apply for generating the sequence. Must be > 0.
        xp: The array library to use for computation (e.g., `numpy` or `cupy`).
            Defaults to `numpy`.

    Returns:
        Tuple[Callable[[int], int], numpy.ndarray | cupy.ndarray]:
            - A generator function that computes $S_n$ efficiently.
            - The transformation matrix $\mathbf{Q}$ used for matrix exponentiation.

    Raises:
        ValueError: If D < 2, if m <= 0, or if D * m is so large that not even
            a one-bit piece of a product fits into int64.

    Examples:
        >>> generator, Q = fast_lfib(5, 100, xp=numpy)
        >>> generator(10)
        4
    """
    # NOTE: the array annotations in this function are quoted so that they are
    # never evaluated; the function can then be defined and called with
    # xp=numpy even when cupy is not available.
    if D < 2:
        raise ValueError("D must be at least 2.")
    if m <= 0:
        raise ValueError("m must be greater than 0.")

    # --- Overflow budget for exact int64 arithmetic -------------------------
    # Matrix entries are at most max_entry (m - 1, or 1 for the 0/1 entries of
    # Q and the identity when m == 1). A dot product of length D between such
    # entries and values below 2**chunk_bits stays <= int64_max as long as
    # 2**chunk_bits <= headroom.
    int64_max = 2**63 - 1
    max_entry = max(m - 1, 1)
    headroom = int64_max // (D * max_entry)
    if headroom < 2:
        raise ValueError("D * m is too large for exact int64 matrix arithmetic.")
    entry_bits = max_entry.bit_length()
    chunk_bits = min(headroom.bit_length() - 1, entry_bits)
    chunk_mask = (1 << chunk_bits) - 1
    chunk_radix = 1 << chunk_bits
    # Bit offset of the most significant piece of an entry.
    top_shift = ((entry_bits - 1) // chunk_bits) * chunk_bits

    # Q has ones on the first superdiagonal (shifts the state by one position)
    # and its last row encodes S_{k+D} = S_k + S_{k+1}.
    Q = xp.eye(D, k=1, dtype=xp.int64)
    Q[-1, 0] = 1
    Q[-1, 1] = 1

    def mat_mul_mod(A: "numpy.ndarray | cupy.ndarray", B: "numpy.ndarray | cupy.ndarray") -> "numpy.ndarray | cupy.ndarray":
        r"""
        Computes $(A B) \bmod m$ without leaving the int64 range.

        B is split into pieces of ``chunk_bits`` bits; the partial products
        are combined from the most significant piece downwards (Horner
        scheme), reducing modulo m after every step.
        """
        acc = None
        for shift in range(top_shift, -1, -chunk_bits):
            part = (A @ ((B >> shift) & chunk_mask)) % m
            # acc < m and part < m, so acc * chunk_radix + part also fits.
            acc = part if acc is None else (acc * chunk_radix + part) % m
        return acc

    def fast_pow(A: "numpy.ndarray | cupy.ndarray", p: int) -> "numpy.ndarray | cupy.ndarray":
        r"""
        Computes $A^p \bmod m$ using binary exponentiation.

        Args:
            A (numpy.ndarray | cupy.ndarray): The input matrix.
            p (int): The power to raise the matrix to. A value <= 0 yields
                the identity matrix.

        Returns:
            numpy.ndarray | cupy.ndarray: The result of $A^p \bmod m$.
        """
        res = xp.eye(A.shape[0], dtype=xp.int64)
        while p > 0:
            if p & 1:
                res = mat_mul_mod(res, A)
            p >>= 1
            # Only square while there are exponent bits left to process.
            if p:
                A = mat_mul_mod(A, A)
        return res

    def generator(n: int) -> int:
        r"""
        Computes the $n$th term in the Lagged Fibonacci sequence.

        Args:
            n (int): The index of the term to compute. Intended for n >= D;
                for 0 <= n < D the initial value 1 (reduced modulo m) is
                returned.

        Returns:
            int: The value of $S_n \bmod m$.

        Raises:
            ValueError: If n is negative.
        """
        if n < 0:
            raise ValueError("n must be non-negative.")
        SS = fast_pow(Q, n - D + 1)
        # The initial state is all ones, so the last component of
        # Q^(n-D+1) applied to it is the sum of the last row.
        return int(SS[-1, :].sum() % m)

    return generator, Q

# Moderate-size example: lag 5, index 2**10 + 5 and a 13-digit modulus.
D, n, m = 5, 2**10 + 5, 1234567891011

# Build the generator with cupy as the array backend and keep the matrix Q.
gen, Q = fast_lfib(D=D, m=m, xp=cupy)

print("Lagged Fibonacci Matrix Q:")
sympy.Matrix(Q.get())  # .get() only required for cupy
# sympy.print_latex(sympy.Matrix(Q.get()))

Lagged Fibonacci Matrix Q:

# Time one evaluation of S_n with the generator `gen` built in the previous
# cell; `n` and `m` are the module-level values assigned there.
start = time.time()
S = gen(n)
print("Time needed (in seconds):", time.time() - start)
print(f"Solution for S_{n} (mod {m}) is {S}")

Time needed (in seconds): 0.0023157596588134766
Solution for S_1029 (mod 1234567891011) is 253512699721

# Final example: a large lag (4000 x 4000 matrix) and a very large index.
D, n, m = 4000, 10**20, 1234567891011

gen, Q = fast_lfib(D=D, m=m, xp=cupy)

# Only the evaluation of S_n is timed, not the construction of the generator.
start = time.time()
S = gen(n)
print("Time needed (in seconds):", time.time() - start)
print(f"Solution for S_{n} (mod {m}) is {S}")

Time needed (in seconds): 14.027729272842407
Solution for S_100000000000000000000 (mod 1234567891011) is 838042074774

Fast Computation of the Lagged Fibonacci Generator

Naive Implementation

Faster Implementation

Final Example: Compute $S_n$ with a large value of $n$ and $D$