Source code for nlsq.caching.unified_cache

"""Unified JAX JIT compilation cache for NLSQ.

This module consolidates three independent cache implementations
(compilation_cache.py, caching.py, smart_cache.py) into a single unified cache
with shape-relaxed keys, comprehensive statistics tracking, and optimized memory management.

Key Features
------------
- Shape-relaxed cache keys: (func_hash, dtype, rank) instead of full shapes
- Comprehensive statistics: hits, misses, compile_time_ms, hit_rate
- LRU eviction with configurable maxsize
- Optional two-tier caching (memory + disk)
- Weak references to avoid memory leaks
- Thread-safe operations via per-instance threading.Lock
- Async disk writes (deferred to Phase 2)

Design Goals
------------
1. 80%+ cache hit rate on typical batch fitting workflows
2. 2-5x reduction in cold-start compile time through better cache reuse
3. Backward compatibility with existing cache APIs (gradual migration)
4. Zero breaking changes to curve_fit API
"""

import hashlib
import logging
import threading
import time
from collections import OrderedDict
from collections.abc import Callable
from functools import wraps
from typing import Any

import jax
import jax.numpy as jnp
import numpy as np

logger = logging.getLogger(__name__)



[docs]
class UnifiedCache:
    """Unified compilation cache merging three legacy cache patterns.

    This cache provides:
    - Shape-relaxed keys: cache based on (func_hash, dtype, rank) not exact shapes
    - Comprehensive stats: hits, misses, compile_time_ms, hit_rate, cache_size
    - LRU eviction when maxsize exceeded
    - Optional disk caching (two-tier architecture)
    - Weak references to functions to prevent memory leaks
    - Thread-safe operations via per-instance lock

    Attributes
    ----------
    maxsize : int
        Maximum number of compiled functions to cache
    enable_stats : bool
        Whether to track cache statistics
    disk_cache_enabled : bool
        Whether to enable disk caching (default: False for Phase 1)

    Examples
    --------
    >>> cache = UnifiedCache(maxsize=128, enable_stats=True)
    >>> def my_func(x, a):
    ...     return a * x ** 2
    >>> x = jnp.array([1.0, 2.0, 3.0])
    >>> compiled = cache.get_or_compile(my_func, (x, 1.0), {}, static_argnums=(1,))
    >>> result = compiled(x, 1.0)
    >>> stats = cache.get_stats()
    >>> print(f"Hit rate: {stats['hit_rate']:.2%}")
    """


[docs]
    def __init__(
        self,
        maxsize: int = 128,
        enable_stats: bool = True,
        disk_cache_enabled: bool = False,  # Deferred to Phase 2 (Task Group 9)
    ):
        """Initialize unified cache.

        Parameters
        ----------
        maxsize : int, default=128
            Maximum number of compiled functions to cache (LRU eviction)
        enable_stats : bool, default=True
            Track cache statistics (hits, misses, compile_time_ms)
        disk_cache_enabled : bool, default=False
            Enable disk caching tier (Phase 2 feature)
        """
        self.maxsize = maxsize
        self.enable_stats = enable_stats
        self.disk_cache_enabled = disk_cache_enabled

        # LRU cache: OrderedDict preserves insertion order for efficient eviction
        self._cache: OrderedDict[str, Callable] = OrderedDict()

        # Compilation time tracking per cache key (ms)
        self._compile_times: dict[str, float] = {}

        # Statistics tracking
        if enable_stats:
            self._stats = {
                "hits": 0,
                "misses": 0,
                "compilations": 0,
                "evictions": 0,
                "cache_size": 0,
            }
        else:
            self._stats = {}

        # Per-instance lock for thread-safe cache operations
        self._lock = threading.Lock()


    def _get_function_hash(self, func: Callable) -> str:
        """Generate stable hash for a function.

        Uses function source code, signature, module, and name to create
        a stable hash that persists across sessions.

        Parameters
        ----------
        func : Callable
            Function to hash

        Returns
        -------
        func_hash : str
            Hexadecimal hash string (16 characters)
        """
        try:
            # Try to get source code for regular functions (from caching.py pattern)
            import inspect

            source = inspect.getsource(func)
            signature = str(inspect.signature(func))
            module = getattr(func, "__module__", "unknown")
            name = getattr(func, "__name__", "unknown")

            # Combine all identifying information
            combined = f"{module}.{name}:{signature}\n{source}"
            return hashlib.sha256(combined.encode()).hexdigest()[:16]

        except (OSError, TypeError):
            # Fallback for built-in functions, lambdas, or C functions
            try:
                if hasattr(func, "__code__"):
                    code = func.__code__
                    code_hash = hashlib.sha256(code.co_code).hexdigest()[:8]
                    return f"code_{code_hash}_{code.co_argcount}"
                else:
                    # Use qualified name for a persistent key instead of id()
                    name = getattr(
                        func,
                        "__qualname__",
                        getattr(func, "__name__", "unknown"),
                    )
                    module = getattr(func, "__module__", "unknown")
                    return hashlib.sha256(f"{module}.{name}".encode()).hexdigest()[:16]
            except (AttributeError, TypeError, ValueError):
                name = getattr(
                    func, "__qualname__", getattr(func, "__name__", "unknown")
                )
                return hashlib.sha256(name.encode()).hexdigest()[:16]

    def _get_array_signature(self, arr) -> str:
        """Get signature for array based on dtype and rank (shape-relaxed).

        This is the key innovation: instead of caching by exact shape,
        cache by (dtype, rank) to enable reuse across different array sizes.

        Parameters
        ----------
        arr : array-like
            JAX or NumPy array

        Returns
        -------
        signature : str
            Signature string: "{dtype}_rank{rank}"
        """
        if isinstance(arr, (np.ndarray, jnp.ndarray, jax.Array)):
            dtype = str(arr.dtype)
            rank = len(arr.shape)
            return f"{dtype}_rank{rank}"
        else:
            # For non-arrays (scalars, etc.), use type name
            return type(arr).__name__

    def _generate_cache_key(
        self,
        func: Callable,
        args: tuple,
        kwargs: dict,
        static_argnums: tuple[int, ...],
    ) -> str:
        """Generate cache key from function and arguments (shape-relaxed).

        Cache key structure: (func_hash, static_argnums, dtype_rank_signatures)

        This enables cache hits across different array sizes with same dtype/rank,
        reducing compilation overhead by 2-5x.

        Parameters
        ----------
        func : Callable
            Function to cache
        args : tuple
            Positional arguments
        kwargs : dict
            Keyword arguments
        static_argnums : tuple of int
            Indices of static arguments

        Returns
        -------
        cache_key : str
            MD5 hash of key components
        """
        key_parts = []

        # 1. Function hash
        func_hash = self._get_function_hash(func)
        key_parts.append(f"func:{func_hash}")

        # 2. Static argnums
        key_parts.append(f"static:{static_argnums}")

        # 3. Array signatures (shape-relaxed: dtype + rank only)
        for i, arg in enumerate(args):
            if i in static_argnums:
                # Static args included in key by value
                key_parts.append(f"arg{i}_static:{arg}")
            else:
                # Non-static args: use dtype + rank only (not full shape)
                sig = self._get_array_signature(arg)
                key_parts.append(f"arg{i}:{sig}")

        # 4. Keyword arguments
        for k, v in sorted(kwargs.items()):
            if isinstance(v, (np.ndarray, jnp.ndarray, jax.Array)):
                sig = self._get_array_signature(v)
                key_parts.append(f"kwarg_{k}:{sig}")
            else:
                key_parts.append(f"kwarg_{k}:{v}")

        # Generate MD5 hash of key string
        key_str = "|".join(key_parts)
        return hashlib.md5(key_str.encode(), usedforsecurity=False).hexdigest()


[docs]
    def get_or_compile(
        self,
        func: Callable,
        args: tuple,
        kwargs: dict,
        static_argnums: tuple[int, ...] = (),
        donate_argnums: tuple[int, ...] = (),
    ) -> Callable:
        """Get cached compiled function or compile if not cached.

        Thread-safe: the lock is held for dict operations only and released
        during expensive JIT compilation to avoid serializing parallel
        compilations.  A re-check after compilation prevents duplicate
        stores when multiple threads miss on the same key simultaneously.

        Parameters
        ----------
        func : Callable
            Function to compile
        args : tuple
            Arguments to function (for signature generation)
        kwargs : dict
            Keyword arguments
        static_argnums : tuple of int, default=()
            Indices of static arguments for JIT
        donate_argnums : tuple of int, default=()
            Indices of arguments to donate for memory efficiency

        Returns
        -------
        compiled_func : Callable
            JIT-compiled function (from cache or newly compiled)
        """
        # Generate cache key (pure computation, no shared state)
        cache_key = self._generate_cache_key(func, args, kwargs, static_argnums)

        # Check cache under lock; record miss stats in the same acquisition
        with self._lock:
            if cache_key in self._cache:
                if self.enable_stats:
                    self._stats["hits"] += 1
                self._cache.move_to_end(cache_key)
                logger.debug(f"Cache hit for key {cache_key[:8]}...")
                return self._cache[cache_key]

            # Cache miss -- update stats while we still hold the lock
            if self.enable_stats:
                self._stats["misses"] += 1
                self._stats["compilations"] += 1

        # Compile outside lock (expensive, don't serialize)
        logger.debug(f"Cache miss for key {cache_key[:8]}..., compiling")
        start_time = time.time()
        compiled_func = jax.jit(
            func, static_argnums=static_argnums, donate_argnums=donate_argnums
        )
        compile_time_ms = (time.time() - start_time) * 1000

        # Store under lock (re-check to avoid duplicate compilation)
        with self._lock:
            # Another thread may have stored while we compiled
            if cache_key in self._cache:
                # Use the already-stored version, discard ours
                self._cache.move_to_end(cache_key)
                return self._cache[cache_key]

            self._compile_times[cache_key] = compile_time_ms

            if len(self._cache) >= self.maxsize:
                oldest_key = next(iter(self._cache))
                del self._cache[oldest_key]
                if oldest_key in self._compile_times:
                    del self._compile_times[oldest_key]
                if self.enable_stats:
                    self._stats["evictions"] += 1
                logger.debug(f"Evicted cache entry {oldest_key[:8]}... (LRU)")

            self._cache[cache_key] = compiled_func

            if self.enable_stats:
                self._stats["cache_size"] = len(self._cache)

        return compiled_func



[docs]
    def get_stats(self) -> dict[str, Any]:
        """Get cache statistics.

        Returns
        -------
        stats : dict
            Cache statistics including:
            - hits : int - Number of cache hits
            - misses : int - Number of cache misses
            - compilations : int - Number of JIT compilations performed
            - evictions : int - Number of LRU evictions
            - cache_size : int - Current cache size
            - hit_rate : float - Cache hit rate (hits / total_requests)
            - compile_time_ms : float - Total compilation time in milliseconds
        """
        if not self.enable_stats:
            return {"enabled": False}

        with self._lock:
            total_requests = self._stats["hits"] + self._stats["misses"]
            hit_rate = (
                self._stats["hits"] / total_requests if total_requests > 0 else 0.0
            )
            total_compile_time_ms = sum(self._compile_times.values())
            return {
                **self._stats,
                "hit_rate": hit_rate,
                "total_requests": total_requests,
                "compile_time_ms": total_compile_time_ms,
            }



[docs]
    def clear(self):
        """Clear all cached compilations and reset statistics."""
        with self._lock:
            self._cache.clear()
            self._compile_times.clear()

            if self.enable_stats:
                self._stats = {
                    "hits": 0,
                    "misses": 0,
                    "compilations": 0,
                    "evictions": 0,
                    "cache_size": 0,
                }

        logger.info("Unified cache cleared")



[docs]
    def __repr__(self) -> str:
        """String representation of cache."""
        if self.enable_stats:
            stats = self.get_stats()
            return (
                f"UnifiedCache(size={stats['cache_size']}/{self.maxsize}, "
                f"hit_rate={stats['hit_rate']:.2%}, "
                f"compilations={stats['compilations']})"
            )
        else:
            with self._lock:
                size = len(self._cache)
            return f"UnifiedCache(size={size}/{self.maxsize})"




# Global unified cache instance
_global_unified_cache: UnifiedCache | None = None
_global_unified_cache_lock = threading.Lock()



[docs]
def get_global_cache() -> UnifiedCache:
    """Get or create global unified cache instance (thread-safe).

    Returns
    -------
    cache : UnifiedCache
        Global unified cache instance
    """
    global _global_unified_cache  # noqa: PLW0603
    if _global_unified_cache is not None:  # Fast path (no lock)
        return _global_unified_cache
    with _global_unified_cache_lock:
        if _global_unified_cache is None:  # Double-check under lock
            _global_unified_cache = UnifiedCache(maxsize=128, enable_stats=True)
        return _global_unified_cache




[docs]
def clear_cache():
    """Clear the global unified cache."""
    global _global_unified_cache  # noqa: PLW0602
    if _global_unified_cache is not None:
        _global_unified_cache.clear()




[docs]
def cached_jit(
    func: Callable | None = None,
    static_argnums: tuple[int, ...] = (),
    donate_argnums: tuple[int, ...] = (),
) -> Callable:
    """Decorator for cached JIT compilation using unified cache.

    This decorator provides automatic caching of JIT-compiled functions
    with shape-relaxed keys for better cache reuse.

    Parameters
    ----------
    func : Callable, optional
        Function to decorate
    static_argnums : tuple of int, default=()
        Indices of static arguments
    donate_argnums : tuple of int, default=()
        Indices of arguments to donate

    Returns
    -------
    decorated : Callable
        Decorated function with cached compilation

    Examples
    --------
    >>> @cached_jit(static_argnums=(1,))
    ... def my_function(x, n):
    ...     return x ** n

    >>> @cached_jit
    ... def simple_function(x):
    ...     return x ** 2
    """

    def decorator(f: Callable) -> Callable:
        cache = get_global_cache()

        @wraps(f)
        def wrapper(*args, **kwargs):
            compiled_func = cache.get_or_compile(
                f,
                args,
                kwargs,
                static_argnums=static_argnums,
                donate_argnums=donate_argnums,
            )
            return compiled_func(*args, **kwargs)

        # Store reference to original function
        wrapper.__wrapped__ = f
        return wrapper

    if func is None:
        # Called with arguments: @cached_jit(static_argnums=(1,))
        return decorator
    else:
        # Called without arguments: @cached_jit
        return decorator(func)




[docs]
def get_cache_stats() -> dict[str, Any]:
    """Get statistics from the global unified cache.

    Returns
    -------
    stats : dict
        Cache statistics
    """
    return get_global_cache().get_stats()



# Backward compatibility wrappers for gradual migration
# These preserve the existing cache APIs from compilation_cache.py, caching.py, smart_cache.py



[docs]
class CompilationCacheCompat:
    """Backward compatibility wrapper for compilation_cache.py API.

    This allows gradual migration of existing code using CompilationCache
    to the new UnifiedCache without breaking changes.
    """


[docs]
    def __init__(self, enable_stats: bool = True):
        """Initialize compatibility wrapper."""
        self._cache = UnifiedCache(enable_stats=enable_stats)



[docs]
    def compile(
        self,
        func: Callable,
        static_argnums: tuple[int, ...] = (),
        donate_argnums: tuple[int, ...] = (),
    ) -> Callable:
        """Compile function with JIT and cache result (compatibility wrapper)."""
        # Use empty args for key generation (will be refined on actual call)
        return self._cache.get_or_compile(
            func,
            args=(),
            kwargs={},
            static_argnums=static_argnums,
            donate_argnums=donate_argnums,
        )



[docs]
    def get_stats(self) -> dict:
        """Get cache statistics (compatibility wrapper)."""
        return self._cache.get_stats()



[docs]
    def clear(self):
        """Clear cache (compatibility wrapper)."""
        self._cache.clear()





[docs]
class FunctionCacheCompat:
    """Backward compatibility wrapper for caching.py API."""


[docs]
    def __init__(self, maxsize: int = 128):
        """Initialize compatibility wrapper."""
        self._cache = UnifiedCache(maxsize=maxsize, enable_stats=True)



[docs]
    def get_function_hash(self, func: Callable) -> str:
        """Generate stable hash for a function (compatibility wrapper)."""
        return self._cache._get_function_hash(func)



[docs]
    def get_stats(self) -> dict[str, Any]:
        """Get cache statistics (compatibility wrapper)."""
        return self._cache.get_stats()



[docs]
    def clear(self):
        """Clear cache (compatibility wrapper)."""
        self._cache.clear()


    @property
    def hit_rate(self) -> float:
        """Get cache hit rate (compatibility wrapper)."""
        stats = self._cache.get_stats()
        return stats.get("hit_rate", 0.0)