Source code for haive.core.persistence.handlers

"""High-level persistence handling utilities for the Haive framework.

This module provides high-level functions for managing persistence operations,
including checkpointer creation, configuration interpretation, state recovery,
and thread management. It serves as a convenient interface layer that abstracts
away the details of specific persistence implementations.

The utilities in this module are designed to work with both simple configuration
dictionaries and full CheckpointerConfig objects, automatically handling fallbacks,
error recovery, and sensible defaults. They provide a robust interface for both
synchronous and asynchronous usage patterns.

Key functions:
- setup_checkpointer / setup_async_checkpointer: Create the appropriate checkpointer for a configuration
- ensure_pool_open / ensure_async_pool_open: Open PostgreSQL connection pools before use
- close_pool_if_needed / close_async_pool_if_needed: Release pools in finally blocks
- register_thread_if_needed / register_async_thread_if_needed: Register threads for tracking and management
- prepare_merged_input: Merge new input with previously persisted state
- get_thread_id_from_config: Extract a thread ID from a RunnableConfig

This module enables a more declarative approach to persistence configuration,
allowing users to specify what they want rather than how to implement it.
"""

import inspect
import json
import logging
from typing import Any

from psycopg_pool import AsyncConnectionPool
from psycopg_pool.pool import ConnectionPool
from pydantic import BaseModel, SecretStr

from haive.core.persistence.memory import MemoryCheckpointerConfig
from haive.core.persistence.postgres_config import PostgresCheckpointerConfig
from haive.core.persistence.types import CheckpointerMode, CheckpointStorageMode

logger = logging.getLogger(__name__)
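
# Usage sketch (illustrative): the declarative flow described in the module
# docstring - state what persistence you want and get a working checkpointer
# back, with memory as the automatic fallback. ``AgentConfig`` is a
# hypothetical caller-side class, not part of this module.
#
#     class AgentConfig:
#         name = "demo-agent"
#         persistence = {"type": "memory"}
#
#     checkpointer = setup_checkpointer(AgentConfig())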


def setup_checkpointer(config: Any) -> Any:
    """Set up the appropriate checkpointer based on persistence configuration.

    This function creates and configures a checkpointer instance based on the
    provided configuration. It handles a variety of configuration formats,
    including direct CheckpointerConfig objects and configuration dictionaries
    embedded in larger config objects.

    The function provides intelligent fallbacks and error handling, ensuring
    that a working checkpointer is always returned - falling back to a memory
    checkpointer if the requested configuration cannot be satisfied.

    Args:
        config: Configuration containing persistence settings, which can be:
            - A direct CheckpointerConfig instance
            - An object with a 'persistence' attribute containing configuration
            - An object with a 'persistence' dictionary specifying type and parameters

    Returns:
        Any: A configured checkpointer instance ready for use

    Examples::

        # Using a direct config object
        from haive.core.persistence import MemoryCheckpointerConfig

        memory_config = MemoryCheckpointerConfig()
        checkpointer = setup_checkpointer(memory_config)

        # Using a config object with a persistence attribute
        class AgentConfig:
            def __init__(self):
                self.persistence = {"type": "postgres", "db_host": "localhost"}

        agent_config = AgentConfig()
        checkpointer = setup_checkpointer(agent_config)

        # With fallback to memory if configuration fails
        checkpointer = setup_checkpointer({"persistence": {"type": "invalid"}})
        # Falls back to a memory checkpointer instead of raising -
        # the function handles errors internally
    """
    # Default to memory checkpointer
    if not hasattr(config, "persistence") or config.persistence is None:
        logger.info(
            f"No persistence config for {getattr(config, 'name', 'unnamed')}. "
            "Using memory checkpointer."
        )
        memory_config = MemoryCheckpointerConfig()
        return memory_config.create_checkpointer()

    # Handle the case where persistence is already a CheckpointerConfig instance
    if hasattr(config.persistence, "create_checkpointer"):
        try:
            return config.persistence.create_checkpointer()
        except Exception as e:
            logger.exception(f"Failed to create checkpointer: {e}")
            logger.warning(
                f"Falling back to memory checkpointer for {getattr(config, 'name', 'unnamed')}"
            )
            memory_config = MemoryCheckpointerConfig()
            return memory_config.create_checkpointer()

    # Handle dictionary config
    if isinstance(config.persistence, dict):
        persistence_type = config.persistence.get("type", "memory")

        if persistence_type == "memory":
            memory_config = MemoryCheckpointerConfig()
            return memory_config.create_checkpointer()

        if persistence_type == "postgres":
            try:
                # Get connection parameters
                use_shallow = config.persistence.get("shallow", False)
                use_async = config.persistence.get("async", False)

                # Create the config
                postgres_config = PostgresCheckpointerConfig(
                    checkpoint_mode=(
                        CheckpointStorageMode.shallow
                        if use_shallow
                        else CheckpointStorageMode.standard
                    ),
                    sync_mode=(
                        CheckpointerMode.async_ if use_async else CheckpointerMode.sync
                    ),
                    db_host=config.persistence.get("db_host", "localhost"),
                    db_port=config.persistence.get("db_port", 5432),
                    db_name=config.persistence.get("db_name", "postgres"),
                    db_user=config.persistence.get("db_user", "postgres"),
                    db_pass=config.persistence.get("db_pass", "postgres"),
                    ssl_mode=config.persistence.get("ssl_mode", "disable"),
                    min_pool_size=config.persistence.get("min_pool_size", 1),
                    max_pool_size=config.persistence.get("max_pool_size", 5),
                    auto_commit=config.persistence.get("auto_commit", True),
                    prepare_threshold=config.persistence.get("prepare_threshold", 0),
                    setup_needed=config.persistence.get("setup_needed", True),
                    connection_string=config.persistence.get("connection_string"),
                    use_pipeline=config.persistence.get("use_pipeline", False),
                )
                return postgres_config.create_checkpointer()
            except Exception as e:
                logger.exception(f"Failed to create PostgreSQL checkpointer: {e}")
                logger.warning(
                    f"Falling back to memory checkpointer for {getattr(config, 'name', 'unnamed')}"
                )
                memory_config = MemoryCheckpointerConfig()
                return memory_config.create_checkpointer()

    # Default to memory checkpointer for any other case
    logger.info(
        f"Using memory checkpointer (default) for {getattr(config, 'name', 'unnamed')}"
    )
    memory_config = MemoryCheckpointerConfig()
    return memory_config.create_checkpointer()

async def setup_async_checkpointer(config: Any) -> Any:
    """Set up the appropriate async checkpointer based on persistence configuration.

    This function analyzes the provided configuration and creates the appropriate
    async checkpointer based on the persistence settings. It properly handles
    different checkpointer types with a focus on async PostgreSQL connections.

    Args:
        config: Configuration containing persistence settings

    Returns:
        A configured async checkpointer instance
    """
    # Default to memory checkpointer
    if not hasattr(config, "persistence") or config.persistence is None:
        logger.info(
            f"No persistence config for {getattr(config, 'name', 'unnamed')}. "
            "Using memory checkpointer."
        )
        memory_config = MemoryCheckpointerConfig()
        return memory_config.create_checkpointer()

    # Handle the case where persistence is a CheckpointerConfig instance
    if hasattr(config.persistence, "create_async_checkpointer"):
        try:
            # Use the async creation method
            return await config.persistence.create_async_checkpointer()
        except Exception as e:
            logger.exception(f"Failed to create async checkpointer: {e}")
            logger.warning(
                f"Falling back to memory checkpointer for {getattr(config, 'name', 'unnamed')}"
            )
            memory_config = MemoryCheckpointerConfig()
            return memory_config.create_checkpointer()

    # Handle dictionary config
    if isinstance(config.persistence, dict):
        persistence_type = config.persistence.get("type", "memory")

        if persistence_type == "memory":
            memory_config = MemoryCheckpointerConfig()
            return memory_config.create_checkpointer()

        if persistence_type == "postgres":
            try:
                # Extract configuration; this function always uses async mode
                use_shallow = config.persistence.get("shallow", False)

                # Create the config
                postgres_config = PostgresCheckpointerConfig(
                    mode=CheckpointerMode.ASYNC,
                    storage_mode=(
                        CheckpointStorageMode.SHALLOW
                        if use_shallow
                        else CheckpointStorageMode.FULL
                    ),
                    db_host=config.persistence.get("db_host", "localhost"),
                    db_port=config.persistence.get("db_port", 5432),
                    db_name=config.persistence.get("db_name", "postgres"),
                    db_user=config.persistence.get("db_user", "postgres"),
                    db_pass=SecretStr(config.persistence.get("db_pass", "postgres")),
                    ssl_mode=config.persistence.get("ssl_mode", "disable"),
                    min_pool_size=config.persistence.get("min_pool_size", 1),
                    max_pool_size=config.persistence.get("max_pool_size", 5),
                    auto_commit=config.persistence.get("auto_commit", True),
                    prepare_threshold=config.persistence.get("prepare_threshold", 0),
                    setup_needed=config.persistence.get("setup_needed", True),
                    connection_kwargs=config.persistence.get("connection_kwargs", {}),
                )
                # Create async checkpointer
                return await postgres_config.create_async_checkpointer()
            except Exception as e:
                logger.exception(f"Failed to create async PostgreSQL checkpointer: {e}")
                logger.warning(
                    f"Falling back to memory checkpointer for {getattr(config, 'name', 'unnamed')}"
                )
                memory_config = MemoryCheckpointerConfig()
                return memory_config.create_checkpointer()

    # Default to memory checkpointer for any other case
    logger.info(
        f"Using memory checkpointer (default) for {getattr(config, 'name', 'unnamed')}"
    )
    memory_config = MemoryCheckpointerConfig()
    return memory_config.create_checkpointer()

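# Usage sketch (illustrative): the async counterpart, run inside an event
# loop. The dictionary keys mirror those read above; ``AgentConfig`` is again
# a hypothetical caller-side class, not part of this module.
#
#     import asyncio
#
#     class AgentConfig:
#         name = "demo-agent"
#         persistence = {"type": "postgres", "db_host": "localhost", "shallow": True}
#
#     async def main() -> None:
#         checkpointer = await setup_async_checkpointer(AgentConfig())
#         ...  # hand the checkpointer to your graph or runtime
#
#     asyncio.run(main())
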
def ensure_pool_open(checkpointer: Any) -> Any | None:
    """Ensure that any PostgreSQL connection pool is properly opened.

    This should be called before any operation that uses the checkpointer.

    Args:
        checkpointer: The checkpointer to check

    Returns:
        The opened pool if one was found and opened, None otherwise
    """
    opened_pool = None

    try:
        # Check for a connection pool on the checkpointer
        if hasattr(checkpointer, "conn"):
            conn = checkpointer.conn

            if isinstance(conn, (ConnectionPool, AsyncConnectionPool)):
                try:
                    # Check if the pool is already open
                    if hasattr(conn, "is_open"):
                        is_open = conn.is_open()
                    else:
                        # Older versions might not have is_open()
                        is_open = getattr(conn, "_opened", False)

                    # Open the pool if needed
                    if not is_open:
                        logger.info("Opening PostgreSQL connection pool")
                        try:
                            conn.open()
                            opened_pool = conn
                            logger.info("Successfully opened pool")
                        except Exception as e:
                            logger.exception(f"Error opening pool: {e}")
                            # Fall back to manipulating the private pool
                            # attributes directly
                            if hasattr(conn, "_pool"):
                                logger.info("Trying alternative pool opening method")
                                conn._pool = [] if conn._pool is None else conn._pool
                                conn._opened = True
                                opened_pool = conn
                except Exception as e:
                    logger.exception(f"Error checking if pool is open: {e}")
                    # Last-ditch effort - direct attribute manipulation
                    if hasattr(conn, "_pool"):
                        conn._pool = [] if conn._pool is None else conn._pool
                        conn._opened = True
                        opened_pool = conn

        # If no pool was found but the checkpointer has a setup method,
        # just make sure its tables are set up
        if not opened_pool and hasattr(checkpointer, "setup"):
            logger.debug("No pool found but checkpointer has setup method")
            try:
                checkpointer.setup()
            except Exception as e:
                logger.exception(f"Error setting up checkpointer: {e}")
    except Exception as e:
        logger.exception(f"Error ensuring pool is open: {e}")

    return opened_pool

async def ensure_async_pool_open(checkpointer: Any) -> Any | None:
    """Ensure that any async PostgreSQL connection pool is properly opened.

    This should be called before any async operation that uses the checkpointer.

    Args:
        checkpointer: The checkpointer to check

    Returns:
        The opened pool if one was found and opened, None otherwise
    """
    opened_pool = None

    try:
        # Skip for non-PostgreSQL checkpointers
        if (
            hasattr(checkpointer, "__class__")
            and "Postgres" not in checkpointer.__class__.__name__
        ):
            return None

        # Check for a connection pool on the checkpointer
        if hasattr(checkpointer, "conn"):
            conn = checkpointer.conn

            if isinstance(conn, AsyncConnectionPool):
                try:
                    # Check if the pool is already open
                    if hasattr(conn, "is_open"):
                        is_open = await conn.is_open()
                    else:
                        # Older versions might not have is_open()
                        is_open = getattr(conn, "_opened", False)

                    # Open the pool if needed
                    if not is_open:
                        logger.info("Opening async PostgreSQL connection pool")
                        try:
                            await conn.open()
                            opened_pool = conn
                            logger.info("Successfully opened async pool")
                        except Exception as e:
                            logger.exception(f"Error opening async pool: {e}")
                            # Fall back to manipulating the private pool
                            # attributes directly
                            if hasattr(conn, "_pool"):
                                logger.info("Trying alternative pool opening method")
                                conn._pool = [] if conn._pool is None else conn._pool
                                conn._opened = True
                                opened_pool = conn
                except Exception as e:
                    logger.exception(f"Error checking if async pool is open: {e}")
                    # Last-ditch effort - direct attribute manipulation
                    if hasattr(conn, "_pool"):
                        conn._pool = [] if conn._pool is None else conn._pool
                        conn._opened = True
                        opened_pool = conn

        # If no pool was opened but the checkpointer has an async setup
        # method, call it; sync setup methods are skipped here
        if not opened_pool and hasattr(checkpointer, "setup"):
            try:
                if inspect.iscoroutinefunction(checkpointer.setup):
                    await checkpointer.setup()
            except Exception as e:
                logger.exception(f"Error setting up async checkpointer: {e}")
    except Exception as e:
        logger.exception(f"Error ensuring async pool is open: {e}")

    return opened_pool

def close_pool_if_needed(checkpointer: Any, pool: Any = None) -> None:
    """Close a PostgreSQL connection pool if it was previously opened.

    This should be called in finally blocks after operations.

    Args:
        checkpointer: The checkpointer to check
        pool: The pool to close. If None, will try to find the pool from
            the checkpointer.
    """
    if pool is None:
        # Try to find a pool from the checkpointer
        try:
            if hasattr(checkpointer, "conn"):
                pool = checkpointer.conn
        except AttributeError:
            return

    # "Close" the pool if it's a ConnectionPool
    try:
        if isinstance(pool, ConnectionPool) and pool.is_open():
            logger.debug("Closing PostgreSQL connection pool")
            # We don't actually close the pool - it's generally reused
            # across invocations, and closing is not recommended unless
            # you're sure you won't need it again
    except (ImportError, AttributeError):
        pass

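# Usage sketch (illustrative): the open/close pairing the docstrings above
# describe - ensure_pool_open() before using the checkpointer,
# close_pool_if_needed() in a finally block. ``agent_config`` is a
# hypothetical caller-side object as in the earlier sketches.
#
#     checkpointer = setup_checkpointer(agent_config)
#     pool = ensure_pool_open(checkpointer)
#     try:
#         ...  # run operations that use the checkpointer
#     finally:
#         close_pool_if_needed(checkpointer, pool)
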
async def close_async_pool_if_needed(checkpointer: Any, pool: Any = None) -> None:
    """Close an async PostgreSQL connection pool if it was previously opened.

    This should be called in finally blocks after async operations.

    Args:
        checkpointer: The checkpointer to check
        pool: The pool to close. If None, will try to find the pool from
            the checkpointer.
    """
    if pool is None:
        # Try to find a pool from the checkpointer
        try:
            if hasattr(checkpointer, "conn"):
                pool = checkpointer.conn
        except AttributeError:
            return

    # "Close" the pool if it's an AsyncConnectionPool
    try:
        if isinstance(pool, AsyncConnectionPool) and await pool.is_open():
            logger.debug("Closing async PostgreSQL connection pool")
            # Similarly, we don't actually close the pool
    except (ImportError, AttributeError):
        pass

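# Usage sketch (illustrative): the same pairing on the async path.
#
#     checkpointer = await setup_async_checkpointer(agent_config)
#     pool = await ensure_async_pool_open(checkpointer)
#     try:
#         ...  # await operations that use the checkpointer
#     finally:
#         await close_async_pool_if_needed(checkpointer, pool)
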
def register_thread_if_needed(
    checkpointer: Any, thread_id: str, metadata: dict[str, Any] | None = None
) -> None:
    """Register a thread in the persistence system if needed.

    Args:
        checkpointer: The checkpointer to use
        thread_id: Thread ID to register
        metadata: Optional metadata to associate with the thread
    """
    # Skip for memory checkpointers
    if (
        hasattr(checkpointer, "__class__")
        and checkpointer.__class__.__name__ == "MemorySaver"
    ):
        return

    # Handle PostgreSQL checkpointers
    if hasattr(checkpointer, "conn"):
        try:
            pool = checkpointer.conn
            if pool:
                # Ensure connection pool is usable
                ensure_pool_open(checkpointer)

                # Register the thread
                with pool.connection() as conn, conn.cursor() as cursor:
                    # Check if threads table exists
                    cursor.execute(
                        """
                        SELECT EXISTS (
                            SELECT FROM information_schema.tables
                            WHERE table_name = 'threads'
                        );
                        """
                    )
                    table_exists = cursor.fetchone()[0]

                    if not table_exists:
                        logger.debug("Creating threads table")
                        cursor.execute(
                            """
                            CREATE TABLE IF NOT EXISTS threads (
                                thread_id TEXT PRIMARY KEY,
                                thread_name TEXT,
                                created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
                                metadata JSONB DEFAULT '{}'::jsonb,
                                user_id TEXT,
                                last_access TIMESTAMPTZ DEFAULT CURRENT_TIMESTAMP
                            );
                            """
                        )

                    # Convert metadata to a JSON string if provided
                    metadata_json = "{}"
                    if metadata:
                        metadata_json = json.dumps(metadata)
                    thread_name = metadata.get("thread_name") if metadata else None

                    # Insert the thread if it does not exist; otherwise refresh it
                    cursor.execute(
                        """
                        INSERT INTO threads (thread_id, thread_name, metadata, last_access)
                        VALUES (%s, %s, %s, CURRENT_TIMESTAMP)
                        ON CONFLICT (thread_id) DO UPDATE
                        SET last_access = CURRENT_TIMESTAMP,
                            thread_name = EXCLUDED.thread_name,
                            metadata = EXCLUDED.metadata
                        """,
                        (thread_id, thread_name, metadata_json),
                    )
                    logger.info(f"Thread {thread_id} registered/updated in PostgreSQL")

                    # Check whether this new thread already has checkpoints, to
                    # catch metadata problems early. Nothing is inserted here -
                    # LangGraph creates the initial checkpoint itself.
                    try:
                        cursor.execute(
                            "SELECT COUNT(*) FROM checkpoints WHERE thread_id = %s",
                            (thread_id,),
                        )
                        checkpoint_count = cursor.fetchone()[0]
                        if checkpoint_count == 0:
                            logger.debug(
                                f"Initializing checkpoint metadata for new thread {thread_id}"
                            )
                    except Exception as init_error:
                        # Not critical - LangGraph handles initial checkpoint creation
                        logger.debug(
                            f"Could not check/initialize checkpoint metadata: {init_error}"
                        )
        except Exception as e:
            logger.warning(f"Error registering thread: {e}")

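# Usage sketch (illustrative): registering a thread before invoking a graph so
# the threads table tracks it. ``graph`` stands for a caller-side compiled
# LangGraph; the metadata keys are free-form JSON.
#
#     thread_id = "user-42-session-7"
#     register_thread_if_needed(
#         checkpointer,
#         thread_id,
#         metadata={"thread_name": "Support chat", "user_id": "user-42"},
#     )
#     result = graph.invoke(inputs, {"configurable": {"thread_id": thread_id}})
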
async def register_async_thread_if_needed(
    checkpointer: Any, thread_id: str, metadata: dict[str, Any] | None = None
) -> None:
    """Register a thread in the persistence system asynchronously if needed.

    Args:
        checkpointer: The checkpointer to use
        thread_id: Thread ID to register
        metadata: Optional metadata to associate with the thread
    """
    # Skip for memory checkpointers
    if (
        hasattr(checkpointer, "__class__")
        and checkpointer.__class__.__name__ == "MemorySaver"
    ):
        return

    # Handle async PostgreSQL checkpointers
    if hasattr(checkpointer, "conn"):
        try:
            pool = checkpointer.conn
            if pool:
                # Ensure connection pool is usable
                await ensure_async_pool_open(checkpointer)

                # Register the thread
                async with pool.connection() as conn, conn.cursor() as cursor:
                    # Check if threads table exists
                    await cursor.execute(
                        """
                        SELECT EXISTS (
                            SELECT FROM information_schema.tables
                            WHERE table_name = 'threads'
                        );
                        """
                    )
                    result = await cursor.fetchone()
                    table_exists = result[0] if result else False

                    if not table_exists:
                        logger.debug("Creating threads table")
                        await cursor.execute(
                            """
                            CREATE TABLE IF NOT EXISTS threads (
                                thread_id TEXT PRIMARY KEY,
                                thread_name TEXT,
                                created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
                                metadata JSONB DEFAULT '{}'::jsonb,
                                user_id TEXT,
                                last_access TIMESTAMPTZ DEFAULT CURRENT_TIMESTAMP
                            );
                            """
                        )

                    # Convert metadata to a JSON string if provided
                    metadata_json = "{}"
                    if metadata:
                        metadata_json = json.dumps(metadata)
                    thread_name = metadata.get("thread_name") if metadata else None

                    # Insert the thread if it does not exist; otherwise refresh it
                    await cursor.execute(
                        """
                        INSERT INTO threads (thread_id, thread_name, metadata, last_access)
                        VALUES (%s, %s, %s, CURRENT_TIMESTAMP)
                        ON CONFLICT (thread_id) DO UPDATE
                        SET last_access = CURRENT_TIMESTAMP,
                            thread_name = EXCLUDED.thread_name,
                            metadata = EXCLUDED.metadata
                        """,
                        (thread_id, thread_name, metadata_json),
                    )
                    logger.info(
                        f"Thread {thread_id} registered/updated asynchronously in PostgreSQL"
                    )
        except Exception as e:
            logger.warning(f"Error registering thread asynchronously: {e}")

def prepare_merged_input(
    input_data: str | list[str] | dict[str, Any] | BaseModel,
    previous_state: Any | None = None,
    runtime_config: dict[str, Any] | None = None,
    input_schema=None,
    state_schema=None,
) -> Any:
    """Process input data and merge with previous state if available.

    Args:
        input_data: Input data in various formats
        previous_state: Previous state from checkpointer
        runtime_config: Runtime configuration
        input_schema: Schema for input validation
        state_schema: Schema for state validation

    Returns:
        Processed input data merged with previous state
    """
    processed_input = input_data

    # Return as-is if there is no previous state
    if not previous_state:
        return processed_input

    # Extract values from a StateSnapshot if needed
    previous_values = None
    if hasattr(previous_state, "values"):
        # StateSnapshot objects
        previous_values = previous_state.values
    elif hasattr(previous_state, "channel_values") and previous_state.channel_values:
        # Alternative attribute name
        previous_values = previous_state.channel_values
    elif isinstance(previous_state, dict):
        # Dictionary state
        previous_values = previous_state

    # Return processed input if no valid previous values
    if not previous_values:
        return processed_input

    # Merge dictionary inputs with dictionary state
    if isinstance(processed_input, dict) and isinstance(previous_values, dict):
        merged_input = dict(previous_values)

        # Update with new input values
        for key, value in processed_input.items():
            # Special case for messages - append rather than replace
            if key == "messages" and key in previous_values:
                # Start with all previous messages, then add the new ones
                merged_messages = list(previous_values["messages"])
                if isinstance(value, list):
                    merged_messages.extend(value)
                else:
                    merged_messages.append(value)
                merged_input["messages"] = merged_messages
            else:
                # For other keys, just override
                merged_input[key] = value

        # Handle shared fields and reducers if using state_schema
        if state_schema:
            # Carry over shared field values not present in the new input
            if hasattr(state_schema, "__shared_fields__"):
                for field in state_schema.__shared_fields__:
                    if field in previous_values and field not in processed_input:
                        merged_input[field] = previous_values[field]

            # Apply reducer functions
            if hasattr(state_schema, "__reducer_fields__"):
                for field, reducer in state_schema.__reducer_fields__.items():
                    if field in merged_input and field in previous_values:
                        try:
                            merged_input[field] = reducer(
                                previous_values[field], merged_input[field]
                            )
                        except Exception as e:
                            logger.warning(f"Reducer for {field} failed: {e}")

        # Validate against the schema if available
        if state_schema:
            try:
                validated = state_schema(**merged_input)
                # Convert back to a dict
                if hasattr(validated, "model_dump"):
                    return validated.model_dump()
                if hasattr(validated, "dict"):
                    return validated.dict()
                return validated
            except Exception as e:
                logger.warning(f"Schema validation failed: {e}")

        return merged_input

    # Return unmodified input as a fallback
    return processed_input

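# Worked example (illustrative): dictionary inputs merge key by key, while
# "messages" appends to the persisted history instead of replacing it.
#
#     previous = {"messages": ["hello"], "step": 1}
#     new_input = {"messages": ["how are you?"], "step": 2}
#     merged = prepare_merged_input(new_input, previous_state=previous)
#     assert merged == {"messages": ["hello", "how are you?"], "step": 2}
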
def get_thread_id_from_config(config: dict[str, Any]) -> str | None:
    """Extract thread_id from a RunnableConfig.

    Args:
        config: Configuration to extract from

    Returns:
        Thread ID if found, None otherwise
    """
    if not config:
        return None

    if isinstance(config, dict) and "configurable" in config:
        return config["configurable"].get("thread_id")

    return None

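# Worked example (illustrative): thread IDs live under the "configurable" key
# of a LangChain/LangGraph RunnableConfig.
#
#     config = {"configurable": {"thread_id": "user-42-session-7"}}
#     assert get_thread_id_from_config(config) == "user-42-session-7"
#     assert get_thread_id_from_config({}) is None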