Core API Reference¶

core.database ¶

Functions¶

dispose_engine `async` ¶

dispose_engine() -> None

Cierra el pool de conexiones limpiamente — llamar antes de shutdown.

Source code in core/database.py

async def dispose_engine() -> None:
    """Cierra el pool de conexiones limpiamente — llamar antes de shutdown."""
    global _async_engine, _async_session_factory, _engine_loop
    if _async_engine is not None:
        await _async_engine.dispose()
        _async_engine = None
        _async_session_factory = None
        _engine_loop = None
        logger.info("🔌 Motor de BD cerrado correctamente")

create_schema `async` ¶

create_schema(schema: str) -> None

Crea un esquema PostgreSQL si no existe (async).

Source code in core/database.py

async def create_schema(schema: str) -> None:
    """Crea un esquema PostgreSQL si no existe (async)."""
    if not re.match(r"^[a-z][a-z0-9_]*$", schema):
        raise ValueError(f"Nombre de schema inválido: '{schema}'")
    engine = _get_async_engine()
    async with engine.begin() as conn:
        await conn.execute(text(f"CREATE SCHEMA IF NOT EXISTS {schema}"))
    logger.info(f"Schema '{schema}' creado/verificado")

create_tables_in_schema `async` ¶

create_tables_in_schema(schema: str) -> None

Crea las tablas SQLModel en el esquema indicado usando el motor async.

Source code in core/database.py

async def create_tables_in_schema(schema: str) -> None:
    """Crea las tablas SQLModel en el esquema indicado usando el motor async."""
    engine = _get_async_engine()
    async with engine.begin() as conn:
        await conn.execute(text(f"SET search_path TO {schema}"))
        await conn.run_sync(SQLModel.metadata.create_all)
    logger.info(f"Tablas creadas en el esquema {schema}")

list_schemas `async` ¶

list_schemas() -> list[str]

Lista los esquemas (workspaces) disponibles.

Source code in core/database.py

async def list_schemas() -> list[str]:
    """Lista los esquemas (workspaces) disponibles."""
    engine = _get_async_engine()
    async with engine.connect() as conn:
        result = await conn.execute(
            text(
                "SELECT schema_name FROM information_schema.schemata "
                "WHERE schema_name NOT LIKE 'pg_%' AND schema_name != 'information_schema'"
            )
        )
        return [row[0] for row in result.fetchall()]

drop_schema `async` ¶

drop_schema(schema: str) -> None

Elimina un esquema y todos sus objetos (CASCADE).

Source code in core/database.py

async def drop_schema(schema: str) -> None:
    """Elimina un esquema y todos sus objetos (CASCADE)."""
    if not re.match(r"^[a-z][a-z0-9_]*$", schema):
        raise ValueError(f"Nombre de schema inválido: '{schema}'")
    engine = _get_async_engine()
    async with engine.begin() as conn:
        await conn.execute(text(f"DROP SCHEMA IF EXISTS {schema} CASCADE"))
    logger.info(f"Schema '{schema}' eliminado")

startup_db `async` ¶

startup_db()

Inicializa el motor y crea tablas en el esquema main.

Alembic se invoca manualmente: poetry run alembic upgrade head

Source code in core/database.py

async def startup_db():
    """Inicializa el motor y crea tablas en el esquema main.

    Alembic se invoca manualmente: poetry run alembic upgrade head
    """
    await create_schema("main")
    await create_tables_in_schema("main")
    logger.info("✅ Base de datos inicializada (tablas creadas en esquema main)")

core.config ¶

Configuración global de Morphix — Settings con pydantic-settings.

Classes¶

Settings ¶

Bases: BaseSettings

Configuración global de Morphix

Source code in core/config.py

class Settings(BaseSettings):
    """Configuración global de Morphix"""

    model_config = SettingsConfigDict(
        env_file=str(ENV_PATH),
        env_file_encoding="utf-8",
        extra="ignore",
    )

    # General
    dark_mode: bool = Field(
        default=True, validation_alias="DARK_MODE", description="Modo oscuro por defecto"
    )
    offline_mode: bool = Field(default=False, validation_alias="OFFLINE_MODE")

    # API Keys
    openai_api_key: str = Field(default="", validation_alias="OPENAI_API_KEY")
    deepseek_api_key: str = Field(default="", validation_alias="DEEPSEEK_API_KEY")
    grok_api_key: str = Field(default="", validation_alias="GROK_API_KEY")
    google_api_key: str = Field(default="", validation_alias="GOOGLE_API_KEY")
    google_cx: str = Field(default="", validation_alias="GOOGLE_CX")
    deepseek_api_base: str = Field(
        default="https://api.deepseek.com",
        validation_alias="DEEPSEEK_API_BASE",
        description="DeepSeek API base URL. Change for proxies or self-hosted deployments.",
    )
    grok_api_base: str = Field(
        default="https://api.x.ai/v1",
        validation_alias="GROK_API_BASE",
        description="Grok API base URL. Change for proxies or self-hosted deployments.",
    )
    hf_token: str = Field(
        default="",
        validation_alias="HF_TOKEN",
        description="HuggingFace API token. Consumed by sentence-transformers/huggingface_hub for model downloads. Without it, anonymous rate limits apply.",
    )

    # Ollama y base de datos
    ollama_base_url: str = Field(
        default="http://localhost:11434", validation_alias="OLLAMA_BASE_URL"
    )
    database_url: str = Field(default="", validation_alias="DATABASE_URL")
    ollama_model: str = Field(default="phi3:mini", validation_alias="OLLAMA_MODEL")
    llm_timeout: int = Field(
        default=60,
        validation_alias="LLM_TIMEOUT",
        description="Timeout for LLM HTTP client connections (used by provider.py).",
    )
    deepseek_strict_mode: bool = Field(
        default=False,
        validation_alias="DEEPSEEK_STRICT_MODE",
        description="Activar strict mode de DeepSeek para forzar respeto de required en tools",
    )
    max_context_tokens: int = Field(
        default=128000,
        validation_alias="MAX_CONTEXT_TOKENS",
        description="Tokens máximos de contexto del modelo",
    )
    redis_url: str = Field(default="redis://localhost:6379/0", validation_alias="REDIS_URL")

    # Default agent names
    default_agent: str = Field(
        default="developer", validation_alias="DEFAULT_AGENT", description="Default agent"
    )
    fallback_agent: str = Field(
        default="conversacional", validation_alias="FALLBACK_AGENT", description="Fallback agent"
    )

    # Seguridad
    encryption_key: str = Field(default="", validation_alias="ENCRYPTION_KEY")
    password_hash: str = Field(default="", validation_alias="PASSWORD_HASH")

    # ==================== MODEL ROLES (centralizado) ====================
    model_roles: dict[str, dict[str, Any]] = Field(
        default_factory=lambda: {
            "default": {"provider": "deepseek", "model": "deepseek-v4-flash", "temperature": 0.7},
            "fast": {"provider": "deepseek", "model": "deepseek-v4-flash", "temperature": 0.3},
            "reasoning": {"provider": "deepseek", "model": "deepseek-v4-flash", "temperature": 0.0},
            "agent": {"provider": "deepseek", "model": "deepseek-v4-flash", "temperature": 0.7},
            "creative": {"provider": "deepseek", "model": "deepseek-v4-flash", "temperature": 0.9},
            "critique": {"provider": "deepseek", "model": "deepseek-v4-flash", "temperature": 0.0},
        },
        description="Model configuration by role. Configure in code (core/config.py). Not settable via .env.",
    )

    @model_validator(mode="after")
    def ensure_encryption_key(self) -> "Settings":
        """Valida que encryption_key exista. En producción lanza error, en desarrollo auto-genera."""
        is_production = os.getenv("MORPHIX_ENV") == "production"
        if not self.encryption_key:
            if is_production:
                logger.critical(
                    "🔑 ENCRYPTION_KEY no configurada en .env. "
                    "En producción es obligatoria. "
                    'Genera una con: python -c "import base64,os; print(base64.urlsafe_b64encode(os.urandom(32)).decode())"'
                )
                raise ValueError(
                    "ENCRYPTION_KEY es obligatoria en producción. "
                    "Configúrala en tu archivo .env."
                )
            generated = base64.urlsafe_b64encode(os.urandom(32)).decode("utf-8")
            self.encryption_key = generated
            logger.warning(
                "🔑 ENCRYPTION_KEY no configurada en .env. Se generó una clave temporal "
                "(solo en desarrollo)."
            )
            logger.warning(
                "⚠️  GUARDA UNA CLAVE en tu .env como ENCRYPTION_KEY=<clave> "
                "o perderás datos encriptados al reiniciar. "
                'Genera una con: python -c "import base64,os; print(base64.urlsafe_b64encode(os.urandom(32)).decode())"'
            )
        else:
            try:
                key_bytes = self.encryption_key.encode()
                Fernet(
                    key_bytes if len(key_bytes) >= 44 else key_bytes + b"=" * (44 - len(key_bytes))
                )
            except Exception:
                logger.error(
                    "❌ ENCRYPTION_KEY en .env no es válida para Fernet (debe ser 32 bytes url-safe base64)."
                )
                if is_production:
                    raise ValueError("ENCRYPTION_KEY inválida en producción.")
        return self

    db_pool_size: int = Field(default=5, validation_alias="DB_POOL_SIZE")
    db_max_overflow: int = Field(default=10, validation_alias="DB_MAX_OVERFLOW")
    db_pool_pre_ping: bool = Field(default=True, validation_alias="DB_POOL_PRE_PING")
    db_pool_recycle: int = Field(default=3600, validation_alias="DB_POOL_RECYCLE")

    # ── Kairos Feature Flags ──
    auto_fix_level: int = Field(default=2, validation_alias="AUTO_FIX_LEVEL")
    context_compression: bool = Field(default=True, validation_alias="CONTEXT_COMPRESSION")
    undercover_mode: bool = Field(default=True, validation_alias="UNDERCOVER_MODE")
    daemon_mode: bool = Field(default=True, validation_alias="DAEMON_MODE")
    self_heal_interval: int = Field(default=120, validation_alias="SELF_HEAL_INTERVAL")
    verbose_logging: bool = Field(default=False, validation_alias="VERBOSE_LOGGING")
    max_subtasks: int = Field(default=8, validation_alias="MAX_SUBTASKS")
    max_agent_iterations: int = Field(default=8, validation_alias="MAX_AGENT_ITERATIONS")
    tools_enabled: bool = Field(default=True, validation_alias="TOOLS_ENABLED")
    allow_code_execution: bool = Field(default=True, validation_alias="ALLOW_CODE_EXECUTION")
    tool_max_retries: int = Field(default=3, validation_alias="TOOL_MAX_RETRIES")
    tool_backoff_base: float = Field(default=1.5, validation_alias="TOOL_BACKOFF_BASE")
    tool_max_tokens_per_workflow: int = Field(
        default=8000, validation_alias="TOOL_MAX_TOKENS_PER_WORKFLOW"
    )
    tool_enable_token_budget: bool = Field(
        default=True, validation_alias="TOOL_ENABLE_TOKEN_BUDGET"
    )
    agent_self_reflection: bool = Field(default=False, validation_alias="AGENT_SELF_REFLECTION")
    default_workflow: str = Field(default="development", validation_alias="DEFAULT_WORKFLOW")
    hooks_enabled: bool = Field(default=True, validation_alias="HOOKS_ENABLED")
    active_workspace: str = Field(default="main", validation_alias="ACTIVE_WORKSPACE")

    # ── LLM Configuration ──
    llm_max_retries: int = Field(default=3, validation_alias="LLM_MAX_RETRIES")
    llm_timeout_seconds: int = Field(
        default=60,
        validation_alias="LLM_TIMEOUT_SECONDS",
        description="Timeout for LLM call operations (used by controller.py Kairos).",
    )
    llm_backoff_factor: float = Field(default=1.5, validation_alias="LLM_BACKOFF_FACTOR")
    llm_rate_per_minute: int = Field(default=20, validation_alias="LLM_RATE_PER_MINUTE")
    llm_rate_per_hour: int = Field(default=200, validation_alias="LLM_RATE_PER_HOUR")

Functions¶

ensure_encryption_key ¶

ensure_encryption_key() -> Settings

Valida que encryption_key exista. En producción lanza error, en desarrollo auto-genera.

Source code in core/config.py

@model_validator(mode="after")
def ensure_encryption_key(self) -> "Settings":
    """Valida que encryption_key exista. En producción lanza error, en desarrollo auto-genera."""
    is_production = os.getenv("MORPHIX_ENV") == "production"
    if not self.encryption_key:
        if is_production:
            logger.critical(
                "🔑 ENCRYPTION_KEY no configurada en .env. "
                "En producción es obligatoria. "
                'Genera una con: python -c "import base64,os; print(base64.urlsafe_b64encode(os.urandom(32)).decode())"'
            )
            raise ValueError(
                "ENCRYPTION_KEY es obligatoria en producción. "
                "Configúrala en tu archivo .env."
            )
        generated = base64.urlsafe_b64encode(os.urandom(32)).decode("utf-8")
        self.encryption_key = generated
        logger.warning(
            "🔑 ENCRYPTION_KEY no configurada en .env. Se generó una clave temporal "
            "(solo en desarrollo)."
        )
        logger.warning(
            "⚠️  GUARDA UNA CLAVE en tu .env como ENCRYPTION_KEY=<clave> "
            "o perderás datos encriptados al reiniciar. "
            'Genera una con: python -c "import base64,os; print(base64.urlsafe_b64encode(os.urandom(32)).decode())"'
        )
    else:
        try:
            key_bytes = self.encryption_key.encode()
            Fernet(
                key_bytes if len(key_bytes) >= 44 else key_bytes + b"=" * (44 - len(key_bytes))
            )
        except Exception:
            logger.error(
                "❌ ENCRYPTION_KEY en .env no es válida para Fernet (debe ser 32 bytes url-safe base64)."
            )
            if is_production:
                raise ValueError("ENCRYPTION_KEY inválida en producción.")
    return self

core.path_resolver ¶

PathResolver — resolución centralizada de rutas del sistema. Elimina hardcodeos de Path("memory"), Path("workspaces"), Path("graficos"), etc.

Classes¶

PathResolver ¶

Provee rutas canónicas para todos los subsistemas.

Source code in core/path_resolver.py

class PathResolver:
    """Provee rutas canónicas para todos los subsistemas."""

    @staticmethod
    def memory_base() -> Path:
        return MEMORY_BASE

    @staticmethod
    def memory_dir(workspace: str) -> Path:
        return MEMORY_BASE / workspace

    @staticmethod
    def code_projects_dir(workspace: str, project_root: str | None = None) -> Path:
        base = MEMORY_BASE / workspace
        if project_root:
            base = base / project_root
        return base

    @staticmethod
    def workspaces_base() -> Path:
        return WORKSPACES_BASE

    @staticmethod
    def workspace_dir(workspace: str) -> Path:
        return WORKSPACES_BASE / workspace

    @staticmethod
    def workspace_agents_dir(workspace: str) -> Path:
        return WORKSPACES_BASE / workspace / "agents"

    @staticmethod
    def workspace_hooks_dir(workspace: str) -> Path:
        return WORKSPACES_BASE / workspace / "hooks"

    @staticmethod
    def mcp_servers_file(workspace: str) -> Path:
        return WORKSPACES_BASE / workspace / "mcp_servers.json"

    @staticmethod
    def workspace_tools_dir(workspace: str) -> Path:
        return WORKSPACES_BASE / workspace / "tools"

    @staticmethod
    def workspace_workflows_dir(workspace: str) -> Path:
        return WORKSPACES_BASE / workspace / "workflows"

    @staticmethod
    def templates_dir() -> Path:
        return TEMPLATES_DIR

    @staticmethod
    def templates_agents_dir() -> Path:
        return TEMPLATES_DIR / "agents"

    @staticmethod
    def templates_hooks_dir() -> Path:
        return TEMPLATES_DIR / "hooks"

    @staticmethod
    def templates_workflows_dir() -> Path:
        return TEMPLATES_DIR / "workflows"

    @staticmethod
    def charts_dir() -> Path:
        return CHARTS_DIR

    @staticmethod
    def exports_dir() -> Path:
        return EXPORTS_DIR

    @staticmethod
    def log_file() -> Path:
        return LOG_FILE

    @staticmethod
    def analytics_charts_dir() -> Path:
        return ANALYTICS_CHARTS_DIR

    @staticmethod
    def normalize_path(file_path: str, project_root: str | None = None) -> str:
        """Normaliza una ruta relativa eliminando el prefijo project_root si está presente.

        Casos:
          file_path='code_projects/miapp/src/main.py', project_root='code_projects/miapp'
            → 'src/main.py'
          file_path='miapp/src/main.py', project_root='code_projects/miapp'
            → 'src/main.py' (el último componente 'miapp' se elimina)
          file_path='src/main.py', project_root='code_projects/miapp'
            → 'src/main.py' (sin cambios)

        Fuente única de verdad para normalización de rutas en todo el sistema.
        """
        if not project_root:
            return file_path

        project_parts = Path(project_root).parts
        path_parts = Path(file_path).parts

        # Case 1: path starts with full project_root
        if (
            len(path_parts) >= len(project_parts)
            and path_parts[: len(project_parts)] == project_parts
        ):
            relative_parts = path_parts[len(project_parts) :]
            return "/".join(relative_parts) if relative_parts else "."

        # Case 2: path starts with the last component of project_root (project name)
        last_part = project_parts[-1]  # ej: "miapp"
        if path_parts and path_parts[0] == last_part:
            relative_parts = path_parts[1:]
            return "/".join(relative_parts) if relative_parts else "."

        return file_path

    @staticmethod
    def normalize_project_root(project_root: str | None) -> str | None:
        """Asegura que project_root tenga el prefijo 'code_projects/'."""
        if project_root and not str(project_root).startswith("code_projects/"):
            return f"code_projects/{project_root}"
        return project_root

Functions¶

normalize_path `staticmethod` ¶

normalize_path(
    file_path: str, project_root: str | None = None
) -> str

Normaliza una ruta relativa eliminando el prefijo project_root si está presente.

Casos

file_path='code_projects/miapp/src/main.py', project_root='code_projects/miapp' → 'src/main.py' file_path='miapp/src/main.py', project_root='code_projects/miapp' → 'src/main.py' (el último componente 'miapp' se elimina) file_path='src/main.py', project_root='code_projects/miapp' → 'src/main.py' (sin cambios)

Fuente única de verdad para normalización de rutas en todo el sistema.

Source code in core/path_resolver.py

@staticmethod
def normalize_path(file_path: str, project_root: str | None = None) -> str:
    """Normaliza una ruta relativa eliminando el prefijo project_root si está presente.

    Casos:
      file_path='code_projects/miapp/src/main.py', project_root='code_projects/miapp'
        → 'src/main.py'
      file_path='miapp/src/main.py', project_root='code_projects/miapp'
        → 'src/main.py' (el último componente 'miapp' se elimina)
      file_path='src/main.py', project_root='code_projects/miapp'
        → 'src/main.py' (sin cambios)

    Fuente única de verdad para normalización de rutas en todo el sistema.
    """
    if not project_root:
        return file_path

    project_parts = Path(project_root).parts
    path_parts = Path(file_path).parts

    # Case 1: path starts with full project_root
    if (
        len(path_parts) >= len(project_parts)
        and path_parts[: len(project_parts)] == project_parts
    ):
        relative_parts = path_parts[len(project_parts) :]
        return "/".join(relative_parts) if relative_parts else "."

    # Case 2: path starts with the last component of project_root (project name)
    last_part = project_parts[-1]  # ej: "miapp"
    if path_parts and path_parts[0] == last_part:
        relative_parts = path_parts[1:]
        return "/".join(relative_parts) if relative_parts else "."

    return file_path

normalize_project_root `staticmethod` ¶

normalize_project_root(
    project_root: str | None,
) -> str | None

Asegura que project_root tenga el prefijo 'code_projects/'.

Source code in core/path_resolver.py

@staticmethod
def normalize_project_root(project_root: str | None) -> str | None:
    """Asegura que project_root tenga el prefijo 'code_projects/'."""
    if project_root and not str(project_root).startswith("code_projects/"):
        return f"code_projects/{project_root}"
    return project_root

core.health ¶

Health check — runtime connectivity probes.

Usage: poetry run python -m core.health

Classes¶

HealthReport `dataclass` ¶

Structured health check result for all services.

Source code in core/health.py

@dataclass
class HealthReport:
    """Structured health check result for all services."""

    timestamp: float = field(default_factory=time.time)
    checks: dict[str, dict[str, Any]] = field(default_factory=dict)
    all_ok: bool = True

    def add(self, name: str, ok: bool, detail: str = "", **extra) -> None:
        self.checks[name] = {"ok": ok, "detail": detail, **extra}
        if not ok:
            self.all_ok = False

    def format(self) -> str:
        lines = ["═══ Morphix Health Check ═══"]
        for name, check in self.checks.items():
            icon = "✅" if check["ok"] else "❌"
            lines.append(f"  {icon} {name}: {check['detail']}")
        lines.append("════════════════════════════")
        lines.append(f"Overall: {'✅ ALL OK' if self.all_ok else '❌ ISSUES DETECTED'}")
        return "\n".join(lines)

Functions¶

check_database `async` ¶

check_database(report: HealthReport) -> None

Probe PostgreSQL connectivity with async SELECT 1.

Source code in core/health.py

async def check_database(report: HealthReport) -> None:
    """Probe PostgreSQL connectivity with async SELECT 1."""
    from core.config import settings

    if not settings.database_url:
        report.add("Database", False, "DATABASE_URL not configured")
        return

    try:
        from sqlalchemy import text
        from sqlalchemy.ext.asyncio import create_async_engine

        url = settings.database_url.replace("postgresql://", "postgresql+asyncpg://")
        engine = create_async_engine(url, echo=False)
        async with engine.connect() as conn:
            start = time.monotonic()
            result = await conn.execute(text("SELECT 1"))
            result.fetchone()
            elapsed = time.monotonic() - start
        await engine.dispose()
        report.add("Database", True, f"OK ({elapsed * 1000:.0f}ms)")
    except Exception as e:
        report.add("Database", False, str(e)[:120])

check_llm `async` ¶

check_llm(report: HealthReport) -> None

Probe LLM provider reachability with a fast connectivity check.

Source code in core/health.py

async def check_llm(report: HealthReport) -> None:
    """Probe LLM provider reachability with a fast connectivity check."""
    import httpx

    from core.config import settings

    provider = "deepseek"
    role_config = settings.model_roles.get("default", {})
    provider_name = role_config.get("provider", "deepseek")

    try:
        async with httpx.AsyncClient(timeout=5.0) as client:
            start = time.monotonic()
            if provider_name == "deepseek":
                resp = await client.get("https://api.deepseek.com/v1/models")
            elif provider_name == "openai":
                resp = await client.get("https://api.openai.com/v1/models")
            else:
                resp = await client.get(f"https://api.{provider_name}.com")
            elapsed = time.monotonic() - start
            if resp.status_code in (200, 401, 403):
                report.add(
                    "LLM",
                    True,
                    f"{provider_name} reachable ({elapsed * 1000:.0f}ms)",
                )
            else:
                report.add("LLM", False, f"{provider_name} returned {resp.status_code}")
    except Exception as e:
        report.add("LLM", False, str(e)[:120])

check_redis `async` ¶

check_redis(report: HealthReport) -> None

Probe Redis connectivity if configured.

Source code in core/health.py

async def check_redis(report: HealthReport) -> None:
    """Probe Redis connectivity if configured."""
    from core.config import settings

    if not settings.redis_url or settings.redis_url == "redis://localhost:6379/0":
        report.add("Redis", True, "not configured (default)")
        return

    try:
        import redis.asyncio as redis

        r = redis.from_url(settings.redis_url)
        start = time.monotonic()
        await r.ping()  # type: ignore[misc]
        elapsed = time.monotonic() - start
        await r.aclose()
        report.add("Redis", True, f"OK ({elapsed * 1000:.0f}ms)")
    except Exception as e:
        report.add("Redis", False, str(e)[:120])

check_filesystem ¶

check_filesystem(report: HealthReport) -> None

Probe critical directories and workspace integrity.

Source code in core/health.py

def check_filesystem(report: HealthReport) -> None:
    """Probe critical directories and workspace integrity."""
    from core.path_resolver import MEMORY_BASE, TEMPLATES_DIR

    try:
        ok = MEMORY_BASE.exists()
        report.add("Memory Dir", ok, str(MEMORY_BASE) if ok else "missing")
    except Exception as e:
        report.add("Memory Dir", False, str(e)[:120])

    try:
        ok = TEMPLATES_DIR.exists()
        templates_count = len(list(TEMPLATES_DIR.glob("**/*.yaml"))) if ok else 0
        report.add(
            "Templates",
            ok,
            f"{templates_count} YAML files" if ok else "missing",
        )
    except Exception as e:
        report.add("Templates", False, str(e)[:120])

check_workspace ¶

check_workspace(report: HealthReport) -> None

Probe current workspace integrity.

Source code in core/health.py

def check_workspace(report: HealthReport) -> None:
    """Probe current workspace integrity."""
    from core.workflow_state import get_active_workflow

    try:
        wf = get_active_workflow()
        report.add("Workspace", True, f"active workflow: {wf}")
    except Exception as e:
        report.add("Workspace", False, str(e)[:120])

run_health_check `async` ¶

run_health_check() -> HealthReport

Run all health checks and return a structured report.

Source code in core/health.py

async def run_health_check() -> HealthReport:
    """Run all health checks and return a structured report."""
    report = HealthReport()

    check_filesystem(report)
    check_workspace(report)
    await check_database(report)
    await check_llm(report)
    await check_redis(report)

    return report

core.bootstrap ¶

Bootstrap — inicialización del backend para el modo desktop PySide6.

Functions¶

validate_config ¶

validate_config() -> tuple[bool, list[str]]

Validate critical configuration at startup.

Returns (valid: bool, warnings: list[str]). Fatal errors raise ValueError. Warnings are non-blocking.

Source code in core/bootstrap.py

def validate_config() -> tuple[bool, list[str]]:
    """Validate critical configuration at startup.

    Returns (valid: bool, warnings: list[str]).
    Fatal errors raise ValueError. Warnings are non-blocking.
    """
    from core.config import settings

    errors: list[str] = []
    warnings: list[str] = []

    # DATABASE_URL is required
    if not settings.database_url:
        errors.append("DATABASE_URL is not set. Copy example.env to .env and configure it.")

    # At least one API key (unless offline mode)
    if not settings.offline_mode:
        has_key = any(
            [
                settings.openai_api_key,
                settings.deepseek_api_key,
                settings.grok_api_key,
            ]
        )
        if not has_key:
            warnings.append(
                "No API keys configured (OPENAI_API_KEY, DEEPSEEK_API_KEY, or GROK_API_KEY). "
                "Enable OFFLINE_MODE=true to use Ollama locally."
            )

    # ENCRYPTION_KEY in production
    from core.config import os as _os

    morphix_env = _os.getenv("MORPHIX_ENV", "development")
    if morphix_env == "production" and not settings.encryption_key:
        errors.append("ENCRYPTION_KEY is required in production (MORPHIX_ENV=production).")

    # Critical directory existence
    from core.path_resolver import MEMORY_BASE, TEMPLATES_DIR

    if not MEMORY_BASE.exists():
        warnings.append(f"Memory base directory missing: {MEMORY_BASE}")

    if not TEMPLATES_DIR.exists():
        warnings.append(f"Templates directory missing: {TEMPLATES_DIR}")

    if errors:
        raise ValueError("Configuration errors:\n- " + "\n- ".join(errors))

    return True, warnings

init_backend `async` ¶

init_backend(
    workspace: str | None = None,
    on_progress: Callable[[str], None] | None = None,
) -> bool

Inicializa BD, workspace, y agentes.

Source code in core/bootstrap.py

async def init_backend(
    workspace: str | None = None,
    on_progress: Callable[[str], None] | None = None,
) -> bool:
    """Inicializa BD, workspace, y agentes."""
    if workspace is None:
        from core.config import settings

        workspace = settings.active_workspace
    try:
        from core.database import startup_db

        if on_progress:
            on_progress("Conectando a base de datos...")
        await startup_db()
        logger.info("Base de datos inicializada")
    except Exception as e:
        logger.critical(f"Error initializing DB: {e}")
        if on_progress:
            on_progress(f"Error BD: {e}")
        return False

    try:
        from core.workspaces import get_global_workspaces

        if on_progress:
            on_progress(f"Activando workspace '{workspace}'...")
        ws = get_global_workspaces()
        await ws.switch_workspace(workspace)
        logger.info(f"Workspace '{workspace}' activado")
    except Exception as e:
        logger.critical(f"Error activando workspace: {e}")
        if on_progress:
            on_progress(f"Error workspace: {e}")
        return False

    try:
        from core.hook_loader import load_global_hooks

        load_global_hooks()
        logger.info("Global hooks loaded")
    except Exception as e:
        logger.warning(f"Error loading global hooks: {e}")

    return True

start_daemons `async` ¶

start_daemons(
    on_offline_changed: Callable[[bool], Any] | None = None,
) -> None

Arranca tareas de fondo: Kairos Daemon y OfflineManager. on_offline_changed: callback opcional async para notificar cambios de estado offline.

Source code in core/bootstrap.py

async def start_daemons(on_offline_changed: Callable[[bool], Any] | None = None) -> None:
    """Arranca tareas de fondo: Kairos Daemon y OfflineManager.
    on_offline_changed: callback opcional async para notificar cambios de estado offline.
    """
    global _daemon_tasks

    from core.config import settings
    from core.feature_flags import kairos

    if settings.daemon_mode:
        logger.info("✅ Kairos Daemon Mode activado")
        _daemon_tasks.append(asyncio.create_task(kairos.daemon_loop()))

    from llm import OfflineManager

    om = OfflineManager()
    await om.detect()

    async def _periodic_offline_check():
        was_offline = om.is_offline()
        while True:
            try:
                await asyncio.sleep(300)
                await om.detect()
                is_offline = om.is_offline()
                if is_offline != was_offline:
                    logger.info(f"Offline status changed: {is_offline}")
                    was_offline = is_offline
                    if on_offline_changed is not None:
                        await on_offline_changed(is_offline)
            except asyncio.CancelledError:
                break

    _daemon_tasks.append(asyncio.create_task(_periodic_offline_check()))
    logger.info("OfflineManager iniciado")

stop_daemons `async` ¶

stop_daemons() -> None

Cancela todas las tareas de fondo limpiamente.

Source code in core/bootstrap.py

async def stop_daemons() -> None:
    """Cancela todas las tareas de fondo limpiamente."""
    global _daemon_tasks
    for task in _daemon_tasks:
        task.cancel()
    if _daemon_tasks:
        await asyncio.gather(*_daemon_tasks, return_exceptions=True)
    _daemon_tasks.clear()
    logger.info("Daemons detenidos")

core.feature_flags ¶

Kairos Feature Flags + Daemon Mode (Claude Code Style - Marzo 2026)

Classes¶

KairosFlags ¶

Source code in core/feature_flags.py

class KairosFlags:
    _instance = None
    _lock = threading.RLock()

    def __new__(cls):
        if cls._instance is None:
            with cls._lock:
                if cls._instance is None:
                    cls._instance = super().__new__(cls)
                    cls._instance._init_flags()
        return cls._instance

    def _init_flags(self):
        from core.config import settings as app_settings

        self.flags: dict[str, Any] = {
            "AUTO_FIX_LEVEL": app_settings.auto_fix_level,
            "CONTEXT_COMPRESSION": app_settings.context_compression,
            "UNDERCOVER_MODE": app_settings.undercover_mode,
            "DAEMON_MODE": app_settings.daemon_mode,
            "SELF_HEAL_INTERVAL": app_settings.self_heal_interval,
            "VERBOSE_LOGGING": app_settings.verbose_logging,
            "MAX_SUBTASKS": app_settings.max_subtasks,
            "tools_enabled": app_settings.tools_enabled,
            "allow_code_execution": app_settings.allow_code_execution,
            "tool_max_retries": app_settings.tool_max_retries,
            "tool_backoff_base": app_settings.tool_backoff_base,
            "tool_max_tokens_per_workflow": app_settings.tool_max_tokens_per_workflow,
            "tool_enable_token_budget": app_settings.tool_enable_token_budget,
            "AGENT_SELF_REFLECTION": app_settings.agent_self_reflection,
            "HOOKS_ENABLED": app_settings.hooks_enabled,
        }
        # Flags que se han modificado en caliente (no recargar del .env)
        self._dirty_flags: set[str] = set()
        logger.info("🚀 Kairos Feature Flags inicializados")
        logger.info(f"   DAEMON_MODE: {self.flags['DAEMON_MODE']}")
        logger.info(f"   TOOLS_ENABLED: {self.flags['tools_enabled']}")
        logger.info(f"   ALLOW_CODE_EXECUTION: {self.flags['allow_code_execution']}")
        logger.info(
            f"   TOOL_MAX_TOKENS_PER_WORKFLOW: {self.flags['tool_max_tokens_per_workflow']}"
        )

    def get(self, key: str, default: Any = None) -> Any:
        """Obtener flag. Solo recarga del .env si no fue modificado en caliente."""
        # If the flag was already changed manually, don't overwrite from the environment
        if key not in self._dirty_flags:
            env_value = os.getenv(key)
            if env_value is not None:
                if isinstance(self.flags.get(key), bool):
                    self.flags[key] = env_value.lower() == "true"
                elif isinstance(self.flags.get(key), int):
                    self.flags[key] = int(env_value)
                elif isinstance(self.flags.get(key), float):
                    self.flags[key] = float(env_value)
                else:
                    self.flags[key] = env_value
        return self.flags.get(key, default)

    def set(self, key: str, value: Any):
        """Cambiar flag en runtime (marcado como manual para evitar hot-reload)."""
        self.flags[key] = value
        self._dirty_flags.add(key)
        logger.info(f"🔄 Flag actualizado: {key} = {value}")

    async def daemon_loop(self):
        """Modo Daemon siempre activo"""
        logger.info("🔄 Kairos Daemon iniciado - Modo siempre activo")
        try:
            while True:
                try:
                    if self.get("DAEMON_MODE"):

                        await memory.write_system(
                            "kairos_daemon_heartbeat",
                            {
                                "timestamp": time.time(),
                                "flags_active": len([k for k, v in self.flags.items() if v]),
                                "auto_fix_level": self.get("AUTO_FIX_LEVEL"),
                            },
                        )

                        await memory.self_healing_check()
                        logger.debug("💓 Daemon heartbeat enviado")
                    await asyncio.sleep(self.get("SELF_HEAL_INTERVAL"))
                except Exception as e:
                    logger.error("Error en daemon loop: %s", e, exc_info=True)
                    await asyncio.sleep(10)
        except asyncio.CancelledError:
            logger.info("Kairos Daemon cancelado")

Functions¶

get ¶

get(key: str, default: Any = None) -> Any

Obtener flag. Solo recarga del .env si no fue modificado en caliente.

Source code in core/feature_flags.py

def get(self, key: str, default: Any = None) -> Any:
    """Obtener flag. Solo recarga del .env si no fue modificado en caliente."""
    # If the flag was already changed manually, don't overwrite from the environment
    if key not in self._dirty_flags:
        env_value = os.getenv(key)
        if env_value is not None:
            if isinstance(self.flags.get(key), bool):
                self.flags[key] = env_value.lower() == "true"
            elif isinstance(self.flags.get(key), int):
                self.flags[key] = int(env_value)
            elif isinstance(self.flags.get(key), float):
                self.flags[key] = float(env_value)
            else:
                self.flags[key] = env_value
    return self.flags.get(key, default)

set ¶

set(key: str, value: Any)

Cambiar flag en runtime (marcado como manual para evitar hot-reload).

Source code in core/feature_flags.py

def set(self, key: str, value: Any):
    """Cambiar flag en runtime (marcado como manual para evitar hot-reload)."""
    self.flags[key] = value
    self._dirty_flags.add(key)
    logger.info(f"🔄 Flag actualizado: {key} = {value}")

daemon_loop `async` ¶

daemon_loop()

Modo Daemon siempre activo

Source code in core/feature_flags.py

async def daemon_loop(self):
    """Modo Daemon siempre activo"""
    logger.info("🔄 Kairos Daemon iniciado - Modo siempre activo")
    try:
        while True:
            try:
                if self.get("DAEMON_MODE"):

                    await memory.write_system(
                        "kairos_daemon_heartbeat",
                        {
                            "timestamp": time.time(),
                            "flags_active": len([k for k, v in self.flags.items() if v]),
                            "auto_fix_level": self.get("AUTO_FIX_LEVEL"),
                        },
                    )

                    await memory.self_healing_check()
                    logger.debug("💓 Daemon heartbeat enviado")
                await asyncio.sleep(self.get("SELF_HEAL_INTERVAL"))
            except Exception as e:
                logger.error("Error en daemon loop: %s", e, exc_info=True)
                await asyncio.sleep(10)
    except asyncio.CancelledError:
        logger.info("Kairos Daemon cancelado")

core.circuit_breaker ¶

Circuit Breaker — protege contra fallos en cascada en llamadas externas.

Implementa el patrón Circuit Breaker para proveedores LLM: - CLOSED: operación normal, se envían requests - OPEN: demasiados fallos consecutivos, se rechazan requests inmediatamente - HALF_OPEN: timeout de recuperación expirado, se permite un request de prueba

Classes¶

CircuitBreaker `dataclass` ¶

Circuit breaker para un proveedor externo.

Parameters:

Name	Type	Description	Default
`failure_threshold`	`int`	fallos consecutivos para abrir el circuito	`5`
`recovery_timeout`	`float`	segundos antes de intentar half-open	`30.0`

Source code in core/circuit_breaker.py

@dataclass
class CircuitBreaker:
    """Circuit breaker para un proveedor externo.

    Args:
        failure_threshold: fallos consecutivos para abrir el circuito
        recovery_timeout: segundos antes de intentar half-open
    """

    failure_threshold: int = 5
    recovery_timeout: float = 30.0
    _lock: threading.Lock = field(default_factory=threading.Lock, repr=False)
    _state: str = field(default="closed", init=False)
    _failures: int = field(default=0, init=False)
    _last_failure_time: float = field(default=0.0, init=False)

    def allow_request(self) -> bool:
        """True si el request debe enviarse, False si debe rechazarse (circuito abierto)."""
        with self._lock:
            if self._state == "closed":
                return True
            if self._state == "open":
                if time.time() - self._last_failure_time >= self.recovery_timeout:
                    self._state = "half_open"
                    return True
                return False
            # half_open: allow one probe request
            return True

    def record_success(self) -> None:
        """Cierra el circuito tras un request exitoso."""
        with self._lock:
            self._state = "closed"
            self._failures = 0

    def record_failure(self) -> None:
        """Registra un fallo. Si se supera el umbral, abre el circuito."""
        with self._lock:
            self._failures += 1
            self._last_failure_time = time.time()
            if self._failures >= self.failure_threshold:
                self._state = "open"

    @property
    def is_open(self) -> bool:
        with self._lock:
            return self._state == "open"

    @property
    def state(self) -> str:
        with self._lock:
            return self._state

    @property
    def failure_count(self) -> int:
        with self._lock:
            return self._failures

Functions¶

allow_request ¶

allow_request() -> bool

True si el request debe enviarse, False si debe rechazarse (circuito abierto).

Source code in core/circuit_breaker.py

def allow_request(self) -> bool:
    """True si el request debe enviarse, False si debe rechazarse (circuito abierto)."""
    with self._lock:
        if self._state == "closed":
            return True
        if self._state == "open":
            if time.time() - self._last_failure_time >= self.recovery_timeout:
                self._state = "half_open"
                return True
            return False
        # half_open: allow one probe request
        return True

record_success ¶

record_success() -> None

Cierra el circuito tras un request exitoso.

Source code in core/circuit_breaker.py

def record_success(self) -> None:
    """Cierra el circuito tras un request exitoso."""
    with self._lock:
        self._state = "closed"
        self._failures = 0

record_failure ¶

record_failure() -> None

Registra un fallo. Si se supera el umbral, abre el circuito.

Source code in core/circuit_breaker.py

def record_failure(self) -> None:
    """Registra un fallo. Si se supera el umbral, abre el circuito."""
    with self._lock:
        self._failures += 1
        self._last_failure_time = time.time()
        if self._failures >= self.failure_threshold:
            self._state = "open"

CircuitBreakerRegistry ¶

Registro global de circuit breakers por proveedor.

Source code in core/circuit_breaker.py

class CircuitBreakerRegistry:
    """Registro global de circuit breakers por proveedor."""

    _breakers: dict[str, CircuitBreaker] = {}
    _lock: threading.Lock = threading.Lock()

    @classmethod
    def get(cls, provider: str) -> CircuitBreaker:
        with cls._lock:
            if provider not in cls._breakers:
                cls._breakers[provider] = CircuitBreaker()
            return cls._breakers[provider]

    @classmethod
    def reset_all(cls) -> None:
        with cls._lock:
            cls._breakers.clear()

    @classmethod
    def get_all_states(cls) -> dict[str, dict]:
        with cls._lock:
            return {
                name: {"state": cb.state, "failures": cb.failure_count}
                for name, cb in cls._breakers.items()
            }

core.rate_limiter ¶

Rate Limiter — control de consumo de llamadas LLM.

Sliding window: limita el número de llamadas por minuto y por hora. Configurable desde Kairos feature flags.

Classes¶

RateLimiter ¶

Rate limiter con sliding window para llamadas LLM.

Source code in core/rate_limiter.py

class RateLimiter:
    """Rate limiter con sliding window para llamadas LLM."""

    def __init__(self, max_per_minute: int = 20, max_per_hour: int = 200):
        self.max_per_minute = max_per_minute
        self.max_per_hour = max_per_hour
        self._minute_window: deque[float] = deque()
        self._hour_window: deque[float] = deque()
        self._lock = asyncio.Lock()

    async def acquire(self) -> bool:
        """Intenta adquirir un slot. Retorna True si está permitido, False si debe esperar."""
        async with self._lock:
            now = time.time()
            # Clean old entries
            while self._minute_window and now - self._minute_window[0] > 60:
                self._minute_window.popleft()
            while self._hour_window and now - self._hour_window[0] > 3600:
                self._hour_window.popleft()

            if len(self._minute_window) >= self.max_per_minute:
                return False
            if len(self._hour_window) >= self.max_per_hour:
                return False

            self._minute_window.append(now)
            self._hour_window.append(now)
            return True

    async def wait_and_acquire(self, timeout: float = 30) -> bool:
        """Espera hasta que haya un slot disponible o se alcance el timeout."""
        deadline = time.time() + timeout
        while time.time() < deadline:
            if await self.acquire():
                return True
            await asyncio.sleep(1)
        return False

    async def remaining(self) -> int:
        """Número de slots disponibles en la ventana actual."""
        async with self._lock:
            now = time.time()
            while self._minute_window and now - self._minute_window[0] > 60:
                self._minute_window.popleft()
            return max(0, self.max_per_minute - len(self._minute_window))

    @property
    def current_minute_count(self) -> int:
        return len(self._minute_window)

    @property
    def current_hour_count(self) -> int:
        return len(self._hour_window)

Functions¶

acquire `async` ¶

acquire() -> bool

Intenta adquirir un slot. Retorna True si está permitido, False si debe esperar.

Source code in core/rate_limiter.py

async def acquire(self) -> bool:
    """Intenta adquirir un slot. Retorna True si está permitido, False si debe esperar."""
    async with self._lock:
        now = time.time()
        # Clean old entries
        while self._minute_window and now - self._minute_window[0] > 60:
            self._minute_window.popleft()
        while self._hour_window and now - self._hour_window[0] > 3600:
            self._hour_window.popleft()

        if len(self._minute_window) >= self.max_per_minute:
            return False
        if len(self._hour_window) >= self.max_per_hour:
            return False

        self._minute_window.append(now)
        self._hour_window.append(now)
        return True

wait_and_acquire `async` ¶

wait_and_acquire(timeout: float = 30) -> bool

Espera hasta que haya un slot disponible o se alcance el timeout.

Source code in core/rate_limiter.py

async def wait_and_acquire(self, timeout: float = 30) -> bool:
    """Espera hasta que haya un slot disponible o se alcance el timeout."""
    deadline = time.time() + timeout
    while time.time() < deadline:
        if await self.acquire():
            return True
        await asyncio.sleep(1)
    return False

remaining `async` ¶

remaining() -> int

Número de slots disponibles en la ventana actual.

Source code in core/rate_limiter.py

async def remaining(self) -> int:
    """Número de slots disponibles en la ventana actual."""
    async with self._lock:
        now = time.time()
        while self._minute_window and now - self._minute_window[0] > 60:
            self._minute_window.popleft()
        return max(0, self.max_per_minute - len(self._minute_window))

core.token_counter ¶

Token Counter — carga lazy de tiktoken.

Centraliza la codificación cl100k_base para evitar cargarla en 4 lugares distintos.

Functions¶

get_encoding ¶

get_encoding()

Return the tiktoken cl100k_base encoding with lazy loading.

La primera llamada carga el encoding (~1-2 MB, ~100ms). Llamadas subsecuentes retornan la instancia cacheada.

Source code in core/token_counter.py

def get_encoding():
    """Return the tiktoken cl100k_base encoding with lazy loading.

    La primera llamada carga el encoding (~1-2 MB, ~100ms).
    Llamadas subsecuentes retornan la instancia cacheada.
    """
    global _enc
    if _enc is None:
        try:
            import tiktoken

            _enc = tiktoken.get_encoding("cl100k_base")
        except ImportError:
            logger.warning("tiktoken no instalado. Conteo de tokens no disponible.")
            return None
        except Exception as e:
            logger.warning(f"Error cargando tiktoken: {e}")
            return None
    return _enc

core.cache_manager ¶

Prompt Cache Manager — multi-provider cache abstraction.

DeepSeek (now): Automatic server-side disk caching. No client API needed. We monitor cache hit/miss via response.usage fields.

Anthropic (future): Client-controlled ephemeral caching via cache_control markers. We inject {"type": "ephemeral"} on system/tools messages.

OpenAI (future): Automatic prompt caching (newer models). Monitor like DeepSeek.

Design

CacheManager is a singleton that accumulates per-workspace cache stats.
track_usage() extracts prompt_cache_hit_tokens / prompt_cache_miss_tokens from any provider response.
get_stats() returns hit rate and token savings for reporting.
stabilize_messages() is a helper that keeps the message prefix intact (critical for DeepSeek's prefix-based disk caching).

Classes¶

CacheManager ¶

Source code in core/cache_manager.py

class CacheManager:
    _instance = None
    _lock = threading.RLock()

    def __new__(cls):
        if cls._instance is None:
            with cls._lock:
                if cls._instance is None:
                    cls._instance = super().__new__(cls)
                    cls._instance._init()
        return cls._instance

    def _init(self) -> None:
        self._global_stats = CacheStats()
        self._workspace_stats: dict[str, CacheStats] = {}
        logger.info("Prompt Cache Manager initialized (DeepSeek auto-cache)")

    def track_usage(
        self,
        prompt_tokens: int = 0,
        completion_tokens: int = 0,
        prompt_cache_hit_tokens: int = 0,
        prompt_cache_miss_tokens: int = 0,
        workspace: str = "main",
    ) -> None:
        """Record token usage and cache metrics from an LLM response."""
        with self._lock:
            # Global stats
            self._global_stats.total_prompt_tokens += prompt_tokens
            self._global_stats.cache_hit_tokens += prompt_cache_hit_tokens
            self._global_stats.cache_miss_tokens += prompt_cache_miss_tokens
            self._global_stats.total_completion_tokens += completion_tokens
            self._global_stats.llm_calls += 1
            self._global_stats.last_updated = time.time()

            # Per-workspace stats
            ws = self._workspace_stats.setdefault(workspace, CacheStats())
            ws.total_prompt_tokens += prompt_tokens
            ws.cache_hit_tokens += prompt_cache_hit_tokens
            ws.cache_miss_tokens += prompt_cache_miss_tokens
            ws.total_completion_tokens += completion_tokens
            ws.llm_calls += 1
            ws.last_updated = time.time()

            if prompt_cache_hit_tokens > 0 or prompt_cache_miss_tokens > 0:
                hit_rate = (
                    prompt_cache_hit_tokens
                    / (prompt_cache_hit_tokens + prompt_cache_miss_tokens)
                    * 100
                )
                logger.debug(
                    f"DeepSeek cache: {prompt_cache_hit_tokens} hit / "
                    f"{prompt_cache_miss_tokens} miss "
                    f"({hit_rate:.0f}% hit rate)"
                )

    def get_stats(self, workspace: str | None = None) -> dict[str, Any]:
        """Return cache statistics as a dict for reporting."""
        with self._lock:
            stats = (
                self._workspace_stats.get(workspace, CacheStats())
                if workspace
                else self._global_stats
            )
            return {
                "prompt_tokens_total": stats.total_prompt_tokens,
                "completion_tokens_total": stats.total_completion_tokens,
                "cache_hit_tokens": stats.cache_hit_tokens,
                "cache_miss_tokens": stats.cache_miss_tokens,
                "cache_hit_rate": round(stats.hit_rate * 100, 1),
                "tokens_saved": stats.tokens_saved,
                "llm_calls": stats.llm_calls,
                "last_updated": stats.last_updated,
            }

    @staticmethod
    def stabilize_messages(messages: list[dict], max_tokens: int) -> list[dict]:
        """Compress messages while preserving the prefix for optimal caching.

        Unlike compress_history() which removes middle messages (breaking the
        prefix for DeepSeek's disk cache), this method keeps the beginning intact
        and summarizes the middle into a single injected context message.

        Strategy for DeepSeek::

            ``[system] [user1] [assistant1] [user2] [assistant2] ... [userN]``
            ``└────── PREFIX (cacheable) ──────┘└── middle ──┘└ recent ─┘``

        We keep: system + first 2 turns (prefix) + last 4 turns (recent)
        We summarize middle turns into a single system-injected context note.
        """
        from core.context_manager import ContextManager

        if not messages or len(messages) <= 6:
            return ContextManager.compress_history(messages, max_tokens)

        system = messages[0] if messages[0].get("role") == "system" else None
        offset = 1 if system else 0

        if len(messages) <= offset + 8:
            return ContextManager.compress_history(messages, max_tokens)

        prefix_count = min(3, len(messages) - offset - 4)
        recent_count = min(6, len(messages) - offset - prefix_count)

        prefix = messages[offset : offset + prefix_count]
        recent = messages[-(recent_count):]
        middle = (
            messages[offset + prefix_count : -recent_count]
            if recent_count
            else messages[offset + prefix_count :]
        )

        # Summarize middle
        summary_text = ContextManager.build_context_summary(
            list(middle), max_tokens=min(500, max_tokens // 4)
        )

        result = [system] if system else []
        result.extend(prefix)

        if summary_text:
            result.append(
                {
                    "role": "system",
                    "content": f"[Earlier context summary]\n{summary_text}",
                }
            )

        result.extend(recent)

        # Safety: if still too large, fall back to standard compression
        est = ContextManager.estimate_tokens(result)
        if est > max_tokens:
            return ContextManager.compress_history(messages, max_tokens)

        return result

Functions¶

track_usage ¶

track_usage(
    prompt_tokens: int = 0,
    completion_tokens: int = 0,
    prompt_cache_hit_tokens: int = 0,
    prompt_cache_miss_tokens: int = 0,
    workspace: str = "main",
) -> None

Record token usage and cache metrics from an LLM response.

Source code in core/cache_manager.py

def track_usage(
    self,
    prompt_tokens: int = 0,
    completion_tokens: int = 0,
    prompt_cache_hit_tokens: int = 0,
    prompt_cache_miss_tokens: int = 0,
    workspace: str = "main",
) -> None:
    """Record token usage and cache metrics from an LLM response."""
    with self._lock:
        # Global stats
        self._global_stats.total_prompt_tokens += prompt_tokens
        self._global_stats.cache_hit_tokens += prompt_cache_hit_tokens
        self._global_stats.cache_miss_tokens += prompt_cache_miss_tokens
        self._global_stats.total_completion_tokens += completion_tokens
        self._global_stats.llm_calls += 1
        self._global_stats.last_updated = time.time()

        # Per-workspace stats
        ws = self._workspace_stats.setdefault(workspace, CacheStats())
        ws.total_prompt_tokens += prompt_tokens
        ws.cache_hit_tokens += prompt_cache_hit_tokens
        ws.cache_miss_tokens += prompt_cache_miss_tokens
        ws.total_completion_tokens += completion_tokens
        ws.llm_calls += 1
        ws.last_updated = time.time()

        if prompt_cache_hit_tokens > 0 or prompt_cache_miss_tokens > 0:
            hit_rate = (
                prompt_cache_hit_tokens
                / (prompt_cache_hit_tokens + prompt_cache_miss_tokens)
                * 100
            )
            logger.debug(
                f"DeepSeek cache: {prompt_cache_hit_tokens} hit / "
                f"{prompt_cache_miss_tokens} miss "
                f"({hit_rate:.0f}% hit rate)"
            )

get_stats ¶

get_stats(workspace: str | None = None) -> dict[str, Any]

Return cache statistics as a dict for reporting.

Source code in core/cache_manager.py

def get_stats(self, workspace: str | None = None) -> dict[str, Any]:
    """Return cache statistics as a dict for reporting."""
    with self._lock:
        stats = (
            self._workspace_stats.get(workspace, CacheStats())
            if workspace
            else self._global_stats
        )
        return {
            "prompt_tokens_total": stats.total_prompt_tokens,
            "completion_tokens_total": stats.total_completion_tokens,
            "cache_hit_tokens": stats.cache_hit_tokens,
            "cache_miss_tokens": stats.cache_miss_tokens,
            "cache_hit_rate": round(stats.hit_rate * 100, 1),
            "tokens_saved": stats.tokens_saved,
            "llm_calls": stats.llm_calls,
            "last_updated": stats.last_updated,
        }

stabilize_messages `staticmethod` ¶

stabilize_messages(
    messages: list[dict], max_tokens: int
) -> list[dict]

Compress messages while preserving the prefix for optimal caching.

Unlike compress_history() which removes middle messages (breaking the prefix for DeepSeek's disk cache), this method keeps the beginning intact and summarizes the middle into a single injected context message.

Strategy for DeepSeek::

``[system] [user1] [assistant1] [user2] [assistant2] ... [userN]``
``└────── PREFIX (cacheable) ──────┘└── middle ──┘└ recent ─┘``

We keep: system + first 2 turns (prefix) + last 4 turns (recent) We summarize middle turns into a single system-injected context note.

Source code in core/cache_manager.py

@staticmethod
def stabilize_messages(messages: list[dict], max_tokens: int) -> list[dict]:
    """Compress messages while preserving the prefix for optimal caching.

    Unlike compress_history() which removes middle messages (breaking the
    prefix for DeepSeek's disk cache), this method keeps the beginning intact
    and summarizes the middle into a single injected context message.

    Strategy for DeepSeek::

        ``[system] [user1] [assistant1] [user2] [assistant2] ... [userN]``
        ``└────── PREFIX (cacheable) ──────┘└── middle ──┘└ recent ─┘``

    We keep: system + first 2 turns (prefix) + last 4 turns (recent)
    We summarize middle turns into a single system-injected context note.
    """
    from core.context_manager import ContextManager

    if not messages or len(messages) <= 6:
        return ContextManager.compress_history(messages, max_tokens)

    system = messages[0] if messages[0].get("role") == "system" else None
    offset = 1 if system else 0

    if len(messages) <= offset + 8:
        return ContextManager.compress_history(messages, max_tokens)

    prefix_count = min(3, len(messages) - offset - 4)
    recent_count = min(6, len(messages) - offset - prefix_count)

    prefix = messages[offset : offset + prefix_count]
    recent = messages[-(recent_count):]
    middle = (
        messages[offset + prefix_count : -recent_count]
        if recent_count
        else messages[offset + prefix_count :]
    )

    # Summarize middle
    summary_text = ContextManager.build_context_summary(
        list(middle), max_tokens=min(500, max_tokens // 4)
    )

    result = [system] if system else []
    result.extend(prefix)

    if summary_text:
        result.append(
            {
                "role": "system",
                "content": f"[Earlier context summary]\n{summary_text}",
            }
        )

    result.extend(recent)

    # Safety: if still too large, fall back to standard compression
    est = ContextManager.estimate_tokens(result)
    if est > max_tokens:
        return ContextManager.compress_history(messages, max_tokens)

    return result

core.context_manager ¶

Context Manager — gestión inteligente de ventana de contexto para LLMs.

Classes¶

ContextManager ¶

Gestión de ventana de contexto: estimación de tokens, compresión, chunking.

Source code in core/context_manager.py

class ContextManager:
    """Gestión de ventana de contexto: estimación de tokens, compresión, chunking."""

    # Approximation: ~4 chars per token for English, ~3 for Spanish/code
    CHARS_PER_TOKEN = 3.5

    @classmethod
    def _max_tokens(cls) -> int:
        from core.config import settings

        return settings.max_context_tokens

    @classmethod
    def estimate_tokens(cls, messages: list[dict]) -> int:
        """Estima el número de tokens en una lista de mensajes."""
        total: float = 0.0
        for msg in messages:
            content = msg.get("content", "")
            if content is None:
                content = ""
            total += len(str(content)) / cls.CHARS_PER_TOKEN
            # Add per-message overhead (~4 tokens)
            total += 4
        return int(total)

    @classmethod
    def compress_history(cls, messages: list[dict], max_tokens: int = 8000) -> list[dict]:
        """Comprime el historial manteniendo system prompt y últimos mensajes."""
        if not messages:
            return []

        system = messages[0] if messages and messages[0].get("role") == "system" else None
        rest = messages[1:] if system else messages

        # Mantener system prompt
        result = [system] if system else []

        # Take recent messages until budget is filled
        taken: list = []
        used = cls.estimate_tokens(result)
        for msg in reversed(rest):
            msg_tokens = cls.estimate_tokens([msg])
            if used + msg_tokens > max_tokens:
                break
            taken.insert(0, msg)
            used += msg_tokens

        return result + taken

    @classmethod
    def chunk_large_file(cls, content: str, file_path: str, chunk_size: int = 2000) -> list[dict]:
        """Divide archivos grandes en chunks solapados con metadatos."""
        lines = content.splitlines(keepends=True)
        if not lines:
            return []

        chunks = []
        start_line = 0
        chunk_idx = 0

        while start_line < len(lines):
            chunk_lines: list = []
            current_len = 0
            end_line = start_line

            for i in range(start_line, len(lines)):
                if current_len + len(lines[i]) > chunk_size and chunk_lines:
                    break
                chunk_lines.append(lines[i])
                current_len += len(lines[i])
                end_line = i + 1

            chunk_text = "".join(chunk_lines)
            chunks.append(
                {
                    "file": file_path,
                    "chunk_index": chunk_idx,
                    "start_line": start_line + 1,
                    "end_line": end_line,
                    "content": chunk_text,
                    "size": len(chunk_text),
                }
            )

            start_line = end_line
            chunk_idx += 1

            # Overlap: last line of previous chunk starts the next
            if end_line < len(lines):
                start_line = max(start_line - 1, 0)

        return chunks

    @classmethod
    def summarize_for_context(cls, text: str, max_chars: int = 500) -> str:
        """Resume un texto para incluirlo en contexto limitado."""
        if len(text) <= max_chars:
            return text
        return text[: max_chars - 3] + "..."

    @classmethod
    def build_context_summary(cls, messages: list[dict], max_tokens: int = 2000) -> str:
        """Construye un resumen del historial para inyectar en nuevo contexto."""
        if not messages:
            return ""
        parts = []
        for msg in messages[-10:]:
            content = msg.get("content", "")
            if content:
                role = msg.get("role", "?")
                parts.append(f"[{role}]: {cls.summarize_for_context(str(content), 200)}")
        return "\n".join(parts)

Functions¶

estimate_tokens `classmethod` ¶

estimate_tokens(messages: list[dict]) -> int

Estima el número de tokens en una lista de mensajes.

Source code in core/context_manager.py

@classmethod
def estimate_tokens(cls, messages: list[dict]) -> int:
    """Estima el número de tokens en una lista de mensajes."""
    total: float = 0.0
    for msg in messages:
        content = msg.get("content", "")
        if content is None:
            content = ""
        total += len(str(content)) / cls.CHARS_PER_TOKEN
        # Add per-message overhead (~4 tokens)
        total += 4
    return int(total)

compress_history `classmethod` ¶

compress_history(
    messages: list[dict], max_tokens: int = 8000
) -> list[dict]

Comprime el historial manteniendo system prompt y últimos mensajes.

Source code in core/context_manager.py

@classmethod
def compress_history(cls, messages: list[dict], max_tokens: int = 8000) -> list[dict]:
    """Comprime el historial manteniendo system prompt y últimos mensajes."""
    if not messages:
        return []

    system = messages[0] if messages and messages[0].get("role") == "system" else None
    rest = messages[1:] if system else messages

    # Mantener system prompt
    result = [system] if system else []

    # Take recent messages until budget is filled
    taken: list = []
    used = cls.estimate_tokens(result)
    for msg in reversed(rest):
        msg_tokens = cls.estimate_tokens([msg])
        if used + msg_tokens > max_tokens:
            break
        taken.insert(0, msg)
        used += msg_tokens

    return result + taken

chunk_large_file `classmethod` ¶

chunk_large_file(
    content: str, file_path: str, chunk_size: int = 2000
) -> list[dict]

Divide archivos grandes en chunks solapados con metadatos.

Source code in core/context_manager.py

@classmethod
def chunk_large_file(cls, content: str, file_path: str, chunk_size: int = 2000) -> list[dict]:
    """Divide archivos grandes en chunks solapados con metadatos."""
    lines = content.splitlines(keepends=True)
    if not lines:
        return []

    chunks = []
    start_line = 0
    chunk_idx = 0

    while start_line < len(lines):
        chunk_lines: list = []
        current_len = 0
        end_line = start_line

        for i in range(start_line, len(lines)):
            if current_len + len(lines[i]) > chunk_size and chunk_lines:
                break
            chunk_lines.append(lines[i])
            current_len += len(lines[i])
            end_line = i + 1

        chunk_text = "".join(chunk_lines)
        chunks.append(
            {
                "file": file_path,
                "chunk_index": chunk_idx,
                "start_line": start_line + 1,
                "end_line": end_line,
                "content": chunk_text,
                "size": len(chunk_text),
            }
        )

        start_line = end_line
        chunk_idx += 1

        # Overlap: last line of previous chunk starts the next
        if end_line < len(lines):
            start_line = max(start_line - 1, 0)

    return chunks

summarize_for_context `classmethod` ¶

summarize_for_context(
    text: str, max_chars: int = 500
) -> str

Resume un texto para incluirlo en contexto limitado.

Source code in core/context_manager.py

@classmethod
def summarize_for_context(cls, text: str, max_chars: int = 500) -> str:
    """Resume un texto para incluirlo en contexto limitado."""
    if len(text) <= max_chars:
        return text
    return text[: max_chars - 3] + "..."

build_context_summary `classmethod` ¶

build_context_summary(
    messages: list[dict], max_tokens: int = 2000
) -> str

Construye un resumen del historial para inyectar en nuevo contexto.

Source code in core/context_manager.py

@classmethod
def build_context_summary(cls, messages: list[dict], max_tokens: int = 2000) -> str:
    """Construye un resumen del historial para inyectar en nuevo contexto."""
    if not messages:
        return ""
    parts = []
    for msg in messages[-10:]:
        content = msg.get("content", "")
        if content:
            role = msg.get("role", "?")
            parts.append(f"[{role}]: {cls.summarize_for_context(str(content), 200)}")
    return "\n".join(parts)

core.change_tracker ¶

Change Tracker — undo/redo de cambios de archivos.

Antes de cada file_manager.write, guarda una copia de respaldo. El usuario puede revertir cambios con el comando 'undo'.

Classes¶

ChangeTracker ¶

Registra cambios de archivos para permitir undo.

Source code in core/change_tracker.py

class ChangeTracker:
    """Registra cambios de archivos para permitir undo."""

    def __init__(self, workspace: str = "main", project_root: str | None = None):
        self.workspace = workspace
        self.project_root = project_root
        self._undo_dir = paths.memory_dir(workspace) / ".undo"
        self._redo_dir = paths.memory_dir(workspace) / ".redo"
        self._undo_dir.mkdir(parents=True, exist_ok=True)
        self._redo_dir.mkdir(parents=True, exist_ok=True)

    def save_before_write(self, file_path: str) -> str | None:
        """Guarda el contenido actual antes de sobrescribir. Retorna el key de undo."""
        full_path = self._resolve(file_path)
        if not full_path.exists():
            return None

        timestamp = int(time.time() * 1000)
        safe_name = _encode_path(file_path)
        backup_path = self._undo_dir / f"{timestamp}_{safe_name}"

        try:
            content = full_path.read_text(encoding="utf-8")
            backup_path.write_text(content, encoding="utf-8")
            logger.info(f"Backup guardado: {backup_path.name}")

            # Clean up old backups (more than 100)
            backups = sorted(self._undo_dir.glob("*"))
            for old in backups[:-100]:
                old.unlink()

            return backup_path.name
        except Exception as e:
            logger.error(f"Error guardando backup: {e}")
            return None

    def undo_last(self) -> str | None:
        """Undo the last change. Returns the restored file path."""
        backups = sorted(self._undo_dir.glob("*"))
        if not backups:
            return None

        last_backup = backups[-1]
        name = last_backup.name
        if "_" not in name:
            logger.warning("Backup con nombre inválido (sin '_'): %s", name)
            return None
        original_path = _decode_path(name.split("_", 1)[1])

        try:
            # Mover archivo actual a redo
            current = self._resolve(original_path)
            if current.exists() and "_" in name:
                parts = name.split("_", 1)
                if len(parts) >= 2:
                    redo_backup = self._redo_dir / f"{int(time.time() * 1000)}_{parts[1]}"
                    redo_backup.write_text(current.read_text(encoding="utf-8"))

            # Restore backup
            current.write_text(last_backup.read_text(encoding="utf-8"))
            last_backup.unlink()
            logger.info(f"Undo aplicado: {original_path}")
            return original_path
        except Exception as e:
            logger.error(f"Error en undo: {e}")
            return None

    def redo_last(self) -> str | None:
        """Re-apply the last undone change."""
        redos = sorted(self._redo_dir.glob("*"))
        if not redos:
            return None

        last_redo = redos[-1]
        name = last_redo.name
        if "_" not in name:
            logger.warning("Redo con nombre inválido (sin '_'): %s", name)
            return None
        original_path = _decode_path(name.split("_", 1)[1])

        try:
            current = self._resolve(original_path)
            current.write_text(last_redo.read_text(encoding="utf-8"))
            last_redo.unlink()
            logger.info(f"Redo aplicado: {original_path}")
            return original_path
        except Exception as e:
            logger.error(f"Error en redo: {e}")
            return None

    def list_undo_stack(self) -> list[str]:
        """Lista los backups disponibles para undo."""
        backups = sorted(self._undo_dir.glob("*"))
        result = []
        for b in backups:
            name = b.name
            original = _decode_path(name.split("_", 1)[1]) if "_" in name else name
            ts = int(name.split("_")[0]) / 1000 if name[0].isdigit() else 0
            result.append(f"{original} ({time.ctime(ts)})")
        return result

    def _resolve(self, file_path: str) -> Path:
        base = paths.memory_dir(self.workspace)
        if self.project_root:
            base = base / self.project_root
        return base / file_path

Functions¶

save_before_write ¶

save_before_write(file_path: str) -> str | None

Guarda el contenido actual antes de sobrescribir. Retorna el key de undo.

Source code in core/change_tracker.py

def save_before_write(self, file_path: str) -> str | None:
    """Guarda el contenido actual antes de sobrescribir. Retorna el key de undo."""
    full_path = self._resolve(file_path)
    if not full_path.exists():
        return None

    timestamp = int(time.time() * 1000)
    safe_name = _encode_path(file_path)
    backup_path = self._undo_dir / f"{timestamp}_{safe_name}"

    try:
        content = full_path.read_text(encoding="utf-8")
        backup_path.write_text(content, encoding="utf-8")
        logger.info(f"Backup guardado: {backup_path.name}")

        # Clean up old backups (more than 100)
        backups = sorted(self._undo_dir.glob("*"))
        for old in backups[:-100]:
            old.unlink()

        return backup_path.name
    except Exception as e:
        logger.error(f"Error guardando backup: {e}")
        return None

undo_last ¶

undo_last() -> str | None

Undo the last change. Returns the restored file path.

Source code in core/change_tracker.py

def undo_last(self) -> str | None:
    """Undo the last change. Returns the restored file path."""
    backups = sorted(self._undo_dir.glob("*"))
    if not backups:
        return None

    last_backup = backups[-1]
    name = last_backup.name
    if "_" not in name:
        logger.warning("Backup con nombre inválido (sin '_'): %s", name)
        return None
    original_path = _decode_path(name.split("_", 1)[1])

    try:
        # Mover archivo actual a redo
        current = self._resolve(original_path)
        if current.exists() and "_" in name:
            parts = name.split("_", 1)
            if len(parts) >= 2:
                redo_backup = self._redo_dir / f"{int(time.time() * 1000)}_{parts[1]}"
                redo_backup.write_text(current.read_text(encoding="utf-8"))

        # Restore backup
        current.write_text(last_backup.read_text(encoding="utf-8"))
        last_backup.unlink()
        logger.info(f"Undo aplicado: {original_path}")
        return original_path
    except Exception as e:
        logger.error(f"Error en undo: {e}")
        return None

redo_last ¶

redo_last() -> str | None

Re-apply the last undone change.

Source code in core/change_tracker.py

def redo_last(self) -> str | None:
    """Re-apply the last undone change."""
    redos = sorted(self._redo_dir.glob("*"))
    if not redos:
        return None

    last_redo = redos[-1]
    name = last_redo.name
    if "_" not in name:
        logger.warning("Redo con nombre inválido (sin '_'): %s", name)
        return None
    original_path = _decode_path(name.split("_", 1)[1])

    try:
        current = self._resolve(original_path)
        current.write_text(last_redo.read_text(encoding="utf-8"))
        last_redo.unlink()
        logger.info(f"Redo aplicado: {original_path}")
        return original_path
    except Exception as e:
        logger.error(f"Error en redo: {e}")
        return None

list_undo_stack ¶

list_undo_stack() -> list[str]

Lista los backups disponibles para undo.

Source code in core/change_tracker.py

def list_undo_stack(self) -> list[str]:
    """Lista los backups disponibles para undo."""
    backups = sorted(self._undo_dir.glob("*"))
    result = []
    for b in backups:
        name = b.name
        original = _decode_path(name.split("_", 1)[1]) if "_" in name else name
        ts = int(name.split("_")[0]) / 1000 if name[0].isdigit() else 0
        result.append(f"{original} ({time.ctime(ts)})")
    return result

core.codebase_indexer ¶

Codebase Indexer — indexación semántica con FAISS + cache en disco.

Classes¶

CodebaseIndexer ¶

Indexa un codebase con FAISS para búsqueda semántica de código relevante.

Source code in core/codebase_indexer.py

class CodebaseIndexer:
    """Indexa un codebase con FAISS para búsqueda semántica de código relevante."""

    def __init__(self, workspace: str = "main", project_root: str | None = None):
        self.workspace = workspace
        self.project_root = project_root
        self._index_built = False
        self._file_hashes: dict[str, str] = {}

        cache_dir = self._cache_dir()
        try:
            self.indexer = FAISSIndexer.load(cache_dir)
            self._index_built = self.indexer.index.ntotal > 0
            logger.info(
                f"Loaded cached FAISS index from {cache_dir} ({self.indexer.document_count} docs)"
            )
        except FileNotFoundError:
            self.indexer = FAISSIndexer()

    def _resolve_base(self) -> Path:
        base = paths.memory_dir(self.workspace)
        if self.project_root:
            base = base / self.project_root
        return base

    def _cache_dir(self) -> Path:
        cache_dir = paths.memory_dir(self.workspace) / ".codebase_cache"
        if self.project_root:
            project_name = Path(self.project_root).name
            cache_dir = cache_dir / project_name
        return cache_dir

    def _load_cache(self) -> dict[str, str]:
        cache_path = self._cache_dir() / CACHE_FILE
        if cache_path.exists():
            try:
                return json.loads(cache_path.read_text())
            except Exception:
                logger.debug("Error leyendo caché en _load_cache", exc_info=True)
        return {}

    def _save_cache(self) -> None:
        cache_path = self._cache_dir() / CACHE_FILE
        cache_path.parent.mkdir(parents=True, exist_ok=True)
        try:
            cache_path.write_text(json.dumps(self._file_hashes, indent=2))
        except Exception:
            logger.debug("Error guardando caché de codebase", exc_info=True)

    def _hash_file(self, file_path: Path) -> str:
        """Hash rápido basado en mtime + tamaño."""
        stat = file_path.stat()
        return hashlib.md5(f"{stat.st_mtime}:{stat.st_size}".encode()).hexdigest()[:12]

    def index_project(
        self,
        patterns: list[str] | None = None,
        max_files: int = MAX_FILES,
        force: bool = False,
        progress_callback: Callable[[dict], None] | None = None,
    ) -> int:
        """Indexa archivos incrementalmente (solo archivos modificados desde último index).

        Args:
            patterns: Extensiones a indexar (None = CODE_EXTENSIONS).
            max_files: Máximo de archivos a indexar.
            force: Si True, reindexa todo ignorando cache.
            progress_callback: Callable(dict) para reportar progreso.

        Returns:
            Número de chunks indexados en esta ejecución.
        """
        base = self._resolve_base()
        if not base.exists():
            logger.debug("Directorio de proyecto no encontrado: %s", base)
            return 0

        # Skip if cache already loaded and not forced
        if not force and self._index_built and self.indexer.document_count > 0:
            logger.info("Using cached FAISS index, skipping re-index")
            return 0

        self._file_hashes = self._load_cache()
        total_chunks = 0
        files_processed = 0

        extensions = patterns if patterns else CODE_EXTENSIONS

        # Rough total estimate for progress
        total_estimate = min(max_files, sum(1 for _ in base.rglob("*") if _.is_file()))

        # Batch indexing: accumulate all chunks first, rebuild once at the end
        pending_chunks: list[tuple[str, object]] = []

        for ext in extensions:
            pattern = f"**/*{ext}" if ext.startswith(".") else f"**/*.{ext}"
            for f in base.glob(pattern):
                if files_processed >= max_files:
                    break
                if not f.is_file():
                    continue
                if any(
                    p in f.parts
                    for p in (".git", "__pycache__", "node_modules", ".venv", ".undo", ".redo")
                ):
                    continue
                if f.stat().st_size > MAX_FILE_SIZE:
                    continue

                rel_path = str(f.relative_to(base))
                current_hash = self._hash_file(f)

                if not force and self._file_hashes.get(rel_path) == current_hash:
                    files_processed += 1
                    continue

                try:
                    content = f.read_text(encoding="utf-8", errors="replace")
                except Exception:
                    files_processed += 1
                    continue

                chunks = ContextManager.chunk_large_file(content, rel_path)
                for chunk in chunks:
                    pending_chunks.append(
                        (
                            f"{chunk['file']}:L{chunk['start_line']}",
                            chunk,
                        )
                    )
                    total_chunks += 1

                self.indexer.remove(rel_path)
                self._file_hashes[rel_path] = current_hash
                files_processed += 1

                # Progress reporting
                if progress_callback and files_processed % 5 == 0:
                    try:
                        progress_callback(
                            {
                                "phase": "indexing",
                                "current_file": rel_path,
                                "files_scanned": files_processed,
                                "total_chunks": total_chunks,
                                "pct": min(99, int(files_processed / max(1, total_estimate) * 100)),
                            }
                        )
                    except Exception:
                        pass

        # Single rebuild with all new chunks at once
        if pending_chunks:
            self.indexer.rebuild_index()
            for key, value in pending_chunks:
                self.indexer.add(key=key, value=value)

        self._index_built = self.indexer.index.ntotal > 0
        self._save_cache()

        # Persist FAISS index to disk
        if self._index_built:
            try:
                self.indexer.save(self._cache_dir())
            except Exception as e:
                logger.warning(f"Failed to save FAISS index: {e}")

        logger.info(f"Codebase indexado: {files_processed} archivos, {total_chunks} chunks nuevos")
        return total_chunks

    def search(self, query: str, k: int = 10) -> list[dict]:
        if not self._index_built:
            return []
        return self.indexer.search(query, k=k)

    def find_relevant_code(self, task: str, max_results: int = 5) -> str:
        results = self.search(task, k=max_results)
        if not results:
            return ""
        parts = []
        for r in results:
            key = r["key"]
            chunk = r["value"]
            if isinstance(chunk, dict):
                file_name = chunk.get("file", key)
                content = chunk.get("content", str(chunk))[:1000]
                start = chunk.get("start_line", "?")
                parts.append(f"// {file_name}:{start}\n{content}")
            else:
                parts.append(f"// {key}\n{str(chunk)[:1000]}")
        return "\n\n".join(parts)

Functions¶

index_project ¶

index_project(
    patterns: list[str] | None = None,
    max_files: int = MAX_FILES,
    force: bool = False,
    progress_callback: Callable[[dict], None] | None = None,
) -> int

Indexa archivos incrementalmente (solo archivos modificados desde último index).

Parameters:

Name	Type	Description	Default
`patterns`	`list[str] \| None`	Extensiones a indexar (None = CODE_EXTENSIONS).	`None`
`max_files`	`int`	Máximo de archivos a indexar.	`MAX_FILES`
`force`	`bool`	Si True, reindexa todo ignorando cache.	`False`
`progress_callback`	`Callable[[dict], None] \| None`	Callable(dict) para reportar progreso.	`None`

Returns:

Type	Description
`int`	Número de chunks indexados en esta ejecución.

Source code in core/codebase_indexer.py

def index_project(
    self,
    patterns: list[str] | None = None,
    max_files: int = MAX_FILES,
    force: bool = False,
    progress_callback: Callable[[dict], None] | None = None,
) -> int:
    """Indexa archivos incrementalmente (solo archivos modificados desde último index).

    Args:
        patterns: Extensiones a indexar (None = CODE_EXTENSIONS).
        max_files: Máximo de archivos a indexar.
        force: Si True, reindexa todo ignorando cache.
        progress_callback: Callable(dict) para reportar progreso.

    Returns:
        Número de chunks indexados en esta ejecución.
    """
    base = self._resolve_base()
    if not base.exists():
        logger.debug("Directorio de proyecto no encontrado: %s", base)
        return 0

    # Skip if cache already loaded and not forced
    if not force and self._index_built and self.indexer.document_count > 0:
        logger.info("Using cached FAISS index, skipping re-index")
        return 0

    self._file_hashes = self._load_cache()
    total_chunks = 0
    files_processed = 0

    extensions = patterns if patterns else CODE_EXTENSIONS

    # Rough total estimate for progress
    total_estimate = min(max_files, sum(1 for _ in base.rglob("*") if _.is_file()))

    # Batch indexing: accumulate all chunks first, rebuild once at the end
    pending_chunks: list[tuple[str, object]] = []

    for ext in extensions:
        pattern = f"**/*{ext}" if ext.startswith(".") else f"**/*.{ext}"
        for f in base.glob(pattern):
            if files_processed >= max_files:
                break
            if not f.is_file():
                continue
            if any(
                p in f.parts
                for p in (".git", "__pycache__", "node_modules", ".venv", ".undo", ".redo")
            ):
                continue
            if f.stat().st_size > MAX_FILE_SIZE:
                continue

            rel_path = str(f.relative_to(base))
            current_hash = self._hash_file(f)

            if not force and self._file_hashes.get(rel_path) == current_hash:
                files_processed += 1
                continue

            try:
                content = f.read_text(encoding="utf-8", errors="replace")
            except Exception:
                files_processed += 1
                continue

            chunks = ContextManager.chunk_large_file(content, rel_path)
            for chunk in chunks:
                pending_chunks.append(
                    (
                        f"{chunk['file']}:L{chunk['start_line']}",
                        chunk,
                    )
                )
                total_chunks += 1

            self.indexer.remove(rel_path)
            self._file_hashes[rel_path] = current_hash
            files_processed += 1

            # Progress reporting
            if progress_callback and files_processed % 5 == 0:
                try:
                    progress_callback(
                        {
                            "phase": "indexing",
                            "current_file": rel_path,
                            "files_scanned": files_processed,
                            "total_chunks": total_chunks,
                            "pct": min(99, int(files_processed / max(1, total_estimate) * 100)),
                        }
                    )
                except Exception:
                    pass

    # Single rebuild with all new chunks at once
    if pending_chunks:
        self.indexer.rebuild_index()
        for key, value in pending_chunks:
            self.indexer.add(key=key, value=value)

    self._index_built = self.indexer.index.ntotal > 0
    self._save_cache()

    # Persist FAISS index to disk
    if self._index_built:
        try:
            self.indexer.save(self._cache_dir())
        except Exception as e:
            logger.warning(f"Failed to save FAISS index: {e}")

    logger.info(f"Codebase indexado: {files_processed} archivos, {total_chunks} chunks nuevos")
    return total_chunks

core.embedding_provider ¶

Classes¶

EmbeddingProvider ¶

Provider lazy de embeddings — carga en background sin bloquear arranque.

Source code in core/embedding_provider.py

class EmbeddingProvider:
    """Provider lazy de embeddings — carga en background sin bloquear arranque."""

    _model_name = "intfloat/multilingual-e5-large"
    _model = None
    _loading = False
    _ready = threading.Event()
    _lock = threading.Lock()

    @classmethod
    def get_instance(cls):
        """Retorna el modelo si está listo. Si no, inicia carga en background.
        Retorna None hasta que el modelo esté completamente cargado.
        """
        if cls._model is not None:
            return cls._model

        with cls._lock:
            if cls._model is not None:
                return cls._model
            if not cls._loading:
                cls._loading = True
                logger.info(f"Iniciando carga en background: {cls._model_name}")
                t = threading.Thread(target=cls._load_model, daemon=True)
                t.start()

        return None

    @classmethod
    def encode(cls, text: str):
        """Wrapper con fallback: si el modelo no está listo, retorna None."""
        model = cls.get_instance()
        if model is None:
            return None
        return model.encode(text)

    @classmethod
    def wait_until_ready(cls, timeout: float = 60) -> bool:
        """Espera hasta que el modelo esté cargado. Retorna True si listo."""
        cls.get_instance()  # starts loading if not active
        return cls._ready.wait(timeout)

    @classmethod
    def _load_model(cls):
        try:
            from sentence_transformers import SentenceTransformer

            logger.info(f"Cargando modelo de embeddings: {cls._model_name}")
            cls._model = SentenceTransformer(cls._model_name)
            logger.info("Modelo de embeddings cargado correctamente.")
            cls._ready.set()
        except Exception as e:
            logger.error(f"Error cargando modelo embeddings: {e}")

Functions¶

get_instance `classmethod` ¶

get_instance()

Retorna el modelo si está listo. Si no, inicia carga en background. Retorna None hasta que el modelo esté completamente cargado.

Source code in core/embedding_provider.py

@classmethod
def get_instance(cls):
    """Retorna el modelo si está listo. Si no, inicia carga en background.
    Retorna None hasta que el modelo esté completamente cargado.
    """
    if cls._model is not None:
        return cls._model

    with cls._lock:
        if cls._model is not None:
            return cls._model
        if not cls._loading:
            cls._loading = True
            logger.info(f"Iniciando carga en background: {cls._model_name}")
            t = threading.Thread(target=cls._load_model, daemon=True)
            t.start()

    return None

encode `classmethod` ¶

encode(text: str)

Wrapper con fallback: si el modelo no está listo, retorna None.

Source code in core/embedding_provider.py

@classmethod
def encode(cls, text: str):
    """Wrapper con fallback: si el modelo no está listo, retorna None."""
    model = cls.get_instance()
    if model is None:
        return None
    return model.encode(text)

wait_until_ready `classmethod` ¶

wait_until_ready(timeout: float = 60) -> bool

Espera hasta que el modelo esté cargado. Retorna True si listo.

Source code in core/embedding_provider.py

@classmethod
def wait_until_ready(cls, timeout: float = 60) -> bool:
    """Espera hasta que el modelo esté cargado. Retorna True si listo."""
    cls.get_instance()  # starts loading if not active
    return cls._ready.wait(timeout)

core.faiss_indexer ¶

FAISS Indexer — indexación semántica reutilizable con FAISS + SentenceTransformer.

Classes¶

FAISSIndexer ¶

Indexación FAISS reutilizable: add, search, save, load, rebuild.

Source code in core/faiss_indexer.py

class FAISSIndexer:
    """Indexación FAISS reutilizable: add, search, save, load, rebuild."""

    def __init__(self, dimension: int = FAISS_DIMENSION, embedder=None):
        self._lock = threading.RLock()
        self.index = faiss.IndexFlatL2(dimension)
        self.documents: list[tuple[str, object]] = []
        self.embedder = embedder or EmbeddingProvider
        if not embedder:
            self.embedder.get_instance()

    def _encode(self, text: str):
        if self.embedder.wait_until_ready(timeout=60):
            return self.embedder.encode(text)
        logger.warning("Modelo embeddings no disponible")
        return None

    def add(self, key: str, value: object) -> None:
        """Añade un documento al índice."""
        embedding = self._encode(str(value))
        if embedding is None:
            return
        with self._lock:
            self.index.add(embedding.reshape(1, -1))
            self.documents.append((key, value))

    def search(self, query: str, k: int = 5) -> list[dict]:
        """Búsqueda semántica. Retorna [{key, value, distance, similarity}]."""
        query_emb = self._encode(query)
        if query_emb is None:
            return []
        query_emb = query_emb.reshape(1, -1)
        with self._lock:
            if self.index.ntotal == 0:
                return []
            distances, indices = self.index.search(query_emb, min(k, self.index.ntotal))
        results = []
        with self._lock:
            for dist, idx in zip(distances[0], indices[0], strict=False):
                if idx >= 0 and idx < len(self.documents):
                    key, value = self.documents[idx]
                    similarity = 1.0 / (1.0 + float(dist))
                    results.append(
                        {
                            "key": key,
                            "value": value,
                            "distance": float(dist),
                            "similarity": float(similarity),
                        }
                    )
        return results

    def remove(self, key: str) -> None:
        """Elimina un documento del índice (requiere rebuild)."""
        with self._lock:
            self.documents = [(k, v) for k, v in self.documents if k != key]

    def rebuild_index(self) -> None:
        """Reconstruye el índice desde cero basado en documents."""
        with self._lock:
            doc_snapshot = list(self.documents)
        precomputed = []
        for _, value in doc_snapshot:
            emb = self._encode(str(value))
            if emb is not None:
                precomputed.append(emb)
        with self._lock:
            self.index = faiss.IndexFlatL2(self.index.d)
            for emb in precomputed:
                self.index.add(emb.reshape(1, -1))

    def clear(self) -> None:
        """Limpia documentos e índice."""
        with self._lock:
            self.documents = []
            self.index = faiss.IndexFlatL2(self.index.d)

    def save(self, directory: Path) -> None:
        """Persiste el índice FAISS y documentos a disco."""
        directory.mkdir(parents=True, exist_ok=True)
        with self._lock:
            faiss.write_index(self.index, str(directory / "faiss.index"))
            with open(directory / "documents.pkl", "wb") as f:
                pickle.dump(self.documents, f)
        logger.info(f"FAISS index saved to {directory} ({self.index.ntotal} vectors)")

    @classmethod
    def load(cls, directory: Path, dimension: int = FAISS_DIMENSION) -> "FAISSIndexer":
        """Carga un índice FAISS desde disco."""
        index_path = directory / "faiss.index"
        docs_path = directory / "documents.pkl"
        if not index_path.exists() or not docs_path.exists():
            raise FileNotFoundError(f"No cached FAISS index at {directory}")
        instance = cls(dimension=dimension)
        instance.index = faiss.read_index(str(index_path))
        with open(docs_path, "rb") as f:
            instance.documents = pickle.load(f)
        logger.info(f"FAISS index loaded from {directory} ({instance.index.ntotal} vectors)")
        return instance

    @property
    def document_count(self) -> int:
        return len(self.documents)

Functions¶

add ¶

add(key: str, value: object) -> None

Añade un documento al índice.

Source code in core/faiss_indexer.py

def add(self, key: str, value: object) -> None:
    """Añade un documento al índice."""
    embedding = self._encode(str(value))
    if embedding is None:
        return
    with self._lock:
        self.index.add(embedding.reshape(1, -1))
        self.documents.append((key, value))

search ¶

search(query: str, k: int = 5) -> list[dict]

Búsqueda semántica. Retorna [{key, value, distance, similarity}].

Source code in core/faiss_indexer.py

def search(self, query: str, k: int = 5) -> list[dict]:
    """Búsqueda semántica. Retorna [{key, value, distance, similarity}]."""
    query_emb = self._encode(query)
    if query_emb is None:
        return []
    query_emb = query_emb.reshape(1, -1)
    with self._lock:
        if self.index.ntotal == 0:
            return []
        distances, indices = self.index.search(query_emb, min(k, self.index.ntotal))
    results = []
    with self._lock:
        for dist, idx in zip(distances[0], indices[0], strict=False):
            if idx >= 0 and idx < len(self.documents):
                key, value = self.documents[idx]
                similarity = 1.0 / (1.0 + float(dist))
                results.append(
                    {
                        "key": key,
                        "value": value,
                        "distance": float(dist),
                        "similarity": float(similarity),
                    }
                )
    return results

remove ¶

remove(key: str) -> None

Elimina un documento del índice (requiere rebuild).

Source code in core/faiss_indexer.py

def remove(self, key: str) -> None:
    """Elimina un documento del índice (requiere rebuild)."""
    with self._lock:
        self.documents = [(k, v) for k, v in self.documents if k != key]

rebuild_index ¶

rebuild_index() -> None

Reconstruye el índice desde cero basado en documents.

Source code in core/faiss_indexer.py

def rebuild_index(self) -> None:
    """Reconstruye el índice desde cero basado en documents."""
    with self._lock:
        doc_snapshot = list(self.documents)
    precomputed = []
    for _, value in doc_snapshot:
        emb = self._encode(str(value))
        if emb is not None:
            precomputed.append(emb)
    with self._lock:
        self.index = faiss.IndexFlatL2(self.index.d)
        for emb in precomputed:
            self.index.add(emb.reshape(1, -1))

clear ¶

clear() -> None

Limpia documentos e índice.

Source code in core/faiss_indexer.py

def clear(self) -> None:
    """Limpia documentos e índice."""
    with self._lock:
        self.documents = []
        self.index = faiss.IndexFlatL2(self.index.d)

save ¶

save(directory: Path) -> None

Persiste el índice FAISS y documentos a disco.

Source code in core/faiss_indexer.py

def save(self, directory: Path) -> None:
    """Persiste el índice FAISS y documentos a disco."""
    directory.mkdir(parents=True, exist_ok=True)
    with self._lock:
        faiss.write_index(self.index, str(directory / "faiss.index"))
        with open(directory / "documents.pkl", "wb") as f:
            pickle.dump(self.documents, f)
    logger.info(f"FAISS index saved to {directory} ({self.index.ntotal} vectors)")

load `classmethod` ¶

load(
    directory: Path, dimension: int = FAISS_DIMENSION
) -> FAISSIndexer

Carga un índice FAISS desde disco.

Source code in core/faiss_indexer.py

@classmethod
def load(cls, directory: Path, dimension: int = FAISS_DIMENSION) -> "FAISSIndexer":
    """Carga un índice FAISS desde disco."""
    index_path = directory / "faiss.index"
    docs_path = directory / "documents.pkl"
    if not index_path.exists() or not docs_path.exists():
        raise FileNotFoundError(f"No cached FAISS index at {directory}")
    instance = cls(dimension=dimension)
    instance.index = faiss.read_index(str(index_path))
    with open(docs_path, "rb") as f:
        instance.documents = pickle.load(f)
    logger.info(f"FAISS index loaded from {directory} ({instance.index.ntotal} vectors)")
    return instance

core.git_operations ¶

Git Operations — helper centralizado para auto-commit y operaciones git comunes.

Smart commit: generates the commit message via LLM based on the task.

Functions¶

auto_commit `async` ¶

auto_commit(
    workspace: str,
    project_root: str | None = None,
    message: str = "Auto-commit: tarea completada",
) -> dict

Ejecuta git init, add -A, commit automático. Retorna {success, output}.

Source code in core/git_operations.py

async def auto_commit(
    workspace: str,
    project_root: str | None = None,
    message: str = "Auto-commit: tarea completada",
) -> dict:
    """Ejecuta git init, add -A, commit automático. Retorna {success, output}."""
    auto_params = {"workspace": workspace}
    if project_root:
        auto_params["project_root"] = project_root

    await safe_tool_call(
        tool_name="git_manager", parameters={"action": "init", **auto_params}, role="agent"
    )
    await safe_tool_call(
        tool_name="git_manager", parameters={"action": "add", **auto_params}, role="agent"
    )
    commit_res = await safe_tool_call(
        tool_name="git_manager",
        parameters={"action": "commit", "message": message, **auto_params},
        role="agent",
    )

    output = str(commit_res.get("output", "")) if isinstance(commit_res, dict) else str(commit_res)
    success = "Commit realizado" in output

    if success:
        logger.info("✅ Auto-commit: %s", message[:60])
    else:
        logger.warning("⚠️ Auto-commit fallido: %s", output[:200])

    return {"success": success, "output": output}

smart_auto_commit `async` ¶

smart_auto_commit(
    workspace: str,
    project_root: str | None = None,
    task_description: str = "",
    files_written: list[str] | None = None,
) -> dict

Commit automático con mensaje generado por LLM basado en la tarea.

Si task_description está vacío, usa el mensaje por defecto. Si hay LLM disponible, genera un resumen de una línea de los cambios.

Source code in core/git_operations.py

async def smart_auto_commit(
    workspace: str,
    project_root: str | None = None,
    task_description: str = "",
    files_written: list[str] | None = None,
) -> dict:
    """Commit automático con mensaje generado por LLM basado en la tarea.

    Si task_description está vacío, usa el mensaje por defecto.
    Si hay LLM disponible, genera un resumen de una línea de los cambios.
    """
    message = "Auto-commit: tarea completada"

    if task_description:
        try:
            message = await _generate_commit_message(task_description, files_written or [])
        except Exception:
            logger.debug("No se pudo generar mensaje de commit vía LLM, usando default")

    return await auto_commit(
        workspace=workspace,
        project_root=project_root,
        message=message,
    )

core.hooks_registry ¶

Classes¶

HookContext `dataclass` ¶

Immutable context passed to every hook invocation.

Source code in core/hooks_registry.py

@dataclass
class HookContext:
    """Immutable context passed to every hook invocation."""

    hook_point: str
    tool_name: str
    parameters: dict[str, Any] = field(default_factory=dict)
    role: str = "agent"
    result: Any = None
    error: str | None = None
    duration: float = 0.0
    attempt: int = 1
    workspace: str = "main"
    session_id: str | None = None

HooksRegistry ¶

Registry for hook callables organized by hook point name.

Mirrors ToolsRegistry pattern: decorator-based registration, global + workspace-scoped via load/unload lifecycle.

Source code in core/hooks_registry.py

class HooksRegistry:
    """Registry for hook callables organized by hook point name.

    Mirrors ToolsRegistry pattern: decorator-based registration,
    global + workspace-scoped via load/unload lifecycle.
    """

    def __init__(self):
        self._hooks: dict[str, list[Callable]] = {}
        self._source_map: dict[int, str] = {}

    def register(self, hook_point: str) -> Callable:
        """Decorator: @hooks_registry.register('on_before_tool')"""

        def decorator(func: Callable) -> Callable:
            handlers = self._hooks.setdefault(hook_point, [])
            if func not in handlers:
                handlers.append(func)
                logger.info(f"Hook registered: {func.__name__} -> {hook_point}")
            self._source_map[id(func)] = hook_point
            return func

        return decorator

    async def dispatch(self, hook_point: str, context: HookContext) -> None:
        """Invoke all hooks registered for hook_point. Exceptions are caught and logged."""
        handlers = self._hooks.get(hook_point, [])
        if not handlers:
            return

        context.hook_point = hook_point

        for hook in handlers:
            try:
                if asyncio.iscoroutinefunction(hook):
                    await hook(context)
                else:
                    hook(context)
            except Exception:
                logger.warning(
                    f"Hook {hook.__name__} at '{hook_point}' failed",
                    exc_info=True,
                )

    def unregister(self, hook_point: str, func: Callable) -> bool:
        """Remove a single hook from a hook point."""
        handlers = self._hooks.get(hook_point)
        if handlers and func in handlers:
            handlers.remove(func)
            if not handlers:
                del self._hooks[hook_point]
            logger.info(f"Hook unregistered: {func.__name__} from {hook_point}")
            return True
        return False

    def clear_hook_point(self, hook_point: str) -> None:
        """Remove all hooks for a given point."""
        self._hooks.pop(hook_point, None)

    def clear(self) -> None:
        """Remove all hooks (used on workspace switch to clean workspace hooks)."""
        self._hooks.clear()
        self._source_map.clear()
        logger.info("All hooks cleared from registry")

    def list_hooks(self) -> dict[str, list[str]]:
        """Return {hook_point: [function_names]} for introspection."""
        return {point: [h.__name__ for h in handlers] for point, handlers in self._hooks.items()}

Functions¶

register ¶

register(hook_point: str) -> Callable

Decorator: @hooks_registry.register('on_before_tool')

Source code in core/hooks_registry.py

def register(self, hook_point: str) -> Callable:
    """Decorator: @hooks_registry.register('on_before_tool')"""

    def decorator(func: Callable) -> Callable:
        handlers = self._hooks.setdefault(hook_point, [])
        if func not in handlers:
            handlers.append(func)
            logger.info(f"Hook registered: {func.__name__} -> {hook_point}")
        self._source_map[id(func)] = hook_point
        return func

    return decorator

dispatch `async` ¶

dispatch(hook_point: str, context: HookContext) -> None

Invoke all hooks registered for hook_point. Exceptions are caught and logged.

Source code in core/hooks_registry.py

async def dispatch(self, hook_point: str, context: HookContext) -> None:
    """Invoke all hooks registered for hook_point. Exceptions are caught and logged."""
    handlers = self._hooks.get(hook_point, [])
    if not handlers:
        return

    context.hook_point = hook_point

    for hook in handlers:
        try:
            if asyncio.iscoroutinefunction(hook):
                await hook(context)
            else:
                hook(context)
        except Exception:
            logger.warning(
                f"Hook {hook.__name__} at '{hook_point}' failed",
                exc_info=True,
            )

unregister ¶

unregister(hook_point: str, func: Callable) -> bool

Remove a single hook from a hook point.

Source code in core/hooks_registry.py

def unregister(self, hook_point: str, func: Callable) -> bool:
    """Remove a single hook from a hook point."""
    handlers = self._hooks.get(hook_point)
    if handlers and func in handlers:
        handlers.remove(func)
        if not handlers:
            del self._hooks[hook_point]
        logger.info(f"Hook unregistered: {func.__name__} from {hook_point}")
        return True
    return False

clear_hook_point ¶

clear_hook_point(hook_point: str) -> None

Remove all hooks for a given point.

Source code in core/hooks_registry.py

def clear_hook_point(self, hook_point: str) -> None:
    """Remove all hooks for a given point."""
    self._hooks.pop(hook_point, None)

clear ¶

clear() -> None

Remove all hooks (used on workspace switch to clean workspace hooks).

Source code in core/hooks_registry.py

def clear(self) -> None:
    """Remove all hooks (used on workspace switch to clean workspace hooks)."""
    self._hooks.clear()
    self._source_map.clear()
    logger.info("All hooks cleared from registry")

list_hooks ¶

list_hooks() -> dict[str, list[str]]

Return {hook_point: [function_names]} for introspection.

Source code in core/hooks_registry.py

def list_hooks(self) -> dict[str, list[str]]:
    """Return {hook_point: [function_names]} for introspection."""
    return {point: [h.__name__ for h in handlers] for point, handlers in self._hooks.items()}

core.hook_loader ¶

Functions¶

load_global_hooks ¶

load_global_hooks() -> None

Load global hooks from core/hooks/.

Source code in core/hook_loader.py

def load_global_hooks() -> None:
    """Load global hooks from core/hooks/."""
    global_dir = Path(__file__).parent / "hooks"
    if not global_dir.exists():
        logger.info("No global hooks directory found")
        return
    for py_file in sorted(global_dir.glob("*.py")):
        if py_file.name.startswith("_"):
            continue
        logger.info(f"Loading global hook: {py_file.name}")
        _import_module_from_file(f"core.hooks.{py_file.stem}", py_file)

load_workspace_hooks ¶

load_workspace_hooks(workspace: str) -> None

Load workspace-local hooks from workspaces//hooks/. Uses pre/post snapshot diff to track which hooks were added by the workspace.

Source code in core/hook_loader.py

def load_workspace_hooks(workspace: str) -> None:
    """Load workspace-local hooks from workspaces/<name>/hooks/.
    Uses pre/post snapshot diff to track which hooks were added by the workspace.
    """
    from core.hooks_registry import hooks_registry

    local_dir = paths.workspace_hooks_dir(workspace)
    if not local_dir.exists():
        logger.info(f"No hooks directory for workspace '{workspace}'")
        return

    # Snapshot current registry state
    pre_snapshot = {
        hook_point: list(handlers) for hook_point, handlers in hooks_registry._hooks.items()
    }

    modules_loaded: list[str] = []
    for py_file in sorted(local_dir.glob("*.py")):
        if py_file.name.startswith("_"):
            continue
        full_name = f"workspaces.{workspace}.hooks.{py_file.stem}"
        if _import_module_from_file(full_name, py_file):
            modules_loaded.append(full_name)

    # Diff: find newly registered hooks
    post_snapshot = {
        hook_point: list(handlers) for hook_point, handlers in hooks_registry._hooks.items()
    }

    workspace_refs: list[tuple[str, Callable]] = []
    for hook_point, handlers in post_snapshot.items():
        pre_handlers = pre_snapshot.get(hook_point, [])
        for handler in handlers:
            if handler not in pre_handlers:
                workspace_refs.append((hook_point, handler))

    _workspace_hook_refs[workspace] = workspace_refs
    _workspace_hook_modules[workspace] = modules_loaded
    logger.info(f"Loaded {len(workspace_refs)} workspace hook(s) for '{workspace}'")

unload_workspace_hooks ¶

unload_workspace_hooks() -> None

Remove only workspace-scoped hooks from registry and sys.modules.

Source code in core/hook_loader.py

def unload_workspace_hooks() -> None:
    """Remove only workspace-scoped hooks from registry and sys.modules."""
    from core.hooks_registry import hooks_registry

    for workspace_name, refs in list(_workspace_hook_refs.items()):
        for hook_point, func in refs:
            hooks_registry.unregister(hook_point, func)
        logger.debug(f"Unloaded {len(refs)} hook(s) from workspace '{workspace_name}'")

    for _workspace_name, module_names in list(_workspace_hook_modules.items()):
        for full_name in module_names:
            if full_name in sys.modules:
                del sys.modules[full_name]

    _workspace_hook_refs.clear()
    _workspace_hook_modules.clear()

core.lru_cache ¶

LRU Cache — thread-safe, TTL, tamaño limitado.

Usado por TaskAnalyzer y AgentRouter para cachear resultados de LLM.

Classes¶

LRUCache ¶

Source code in core/lru_cache.py

class LRUCache:
    def __init__(self, max_size: int = 500, ttl: int = 300):
        self._cache: OrderedDict = OrderedDict()
        self._max_size = max_size
        self._ttl = ttl
        self._lock = threading.RLock()

    def get(self, key: str) -> Any | None:
        """Retorna valor cacheado si existe y no expiró. None si no."""
        with self._lock:
            if key not in self._cache:
                return None
            value, timestamp = self._cache[key]
            if time.time() - timestamp > self._ttl:
                self._cache.pop(key, None)
                return None
            self._cache.move_to_end(key)
            return value

    def set(self, key: str, value: Any) -> None:
        """Guarda valor en cache con timestamp actual."""
        with self._lock:
            if key in self._cache:
                self._cache.move_to_end(key)
            self._cache[key] = (value, time.time())
            # Evict LRU if exceeds size
            while len(self._cache) > self._max_size:
                self._cache.popitem(last=False)

    def clear_expired(self) -> int:
        """Elimina entradas expiradas. Retorna cuántas eliminó."""
        with self._lock:
            now = time.time()
            expired = [k for k, (_, ts) in list(self._cache.items()) if now - ts > self._ttl]
            for k in expired:
                self._cache.pop(k, None)
            return len(expired)

    def __len__(self) -> int:
        with self._lock:
            return len(self._cache)

Functions¶

get ¶

get(key: str) -> Any | None

Retorna valor cacheado si existe y no expiró. None si no.

Source code in core/lru_cache.py

def get(self, key: str) -> Any | None:
    """Retorna valor cacheado si existe y no expiró. None si no."""
    with self._lock:
        if key not in self._cache:
            return None
        value, timestamp = self._cache[key]
        if time.time() - timestamp > self._ttl:
            self._cache.pop(key, None)
            return None
        self._cache.move_to_end(key)
        return value

set ¶

set(key: str, value: Any) -> None

Guarda valor en cache con timestamp actual.

Source code in core/lru_cache.py

def set(self, key: str, value: Any) -> None:
    """Guarda valor en cache con timestamp actual."""
    with self._lock:
        if key in self._cache:
            self._cache.move_to_end(key)
        self._cache[key] = (value, time.time())
        # Evict LRU if exceeds size
        while len(self._cache) > self._max_size:
            self._cache.popitem(last=False)

clear_expired ¶

clear_expired() -> int

Elimina entradas expiradas. Retorna cuántas eliminó.

Source code in core/lru_cache.py

def clear_expired(self) -> int:
    """Elimina entradas expiradas. Retorna cuántas eliminó."""
    with self._lock:
        now = time.time()
        expired = [k for k, (_, ts) in list(self._cache.items()) if now - ts > self._ttl]
        for k in expired:
            self._cache.pop(k, None)
        return len(expired)

core.metrics ¶

Metrics — contadores de uso del sistema.

Métricas acumulativas: tokens, workflows, herramientas. Métricas por herramienta: éxito/fallo, latencia. Expuestas via comando :stats en CLI y panel desktop.

Classes¶

Metrics `dataclass` ¶

Source code in core/metrics.py

@dataclass
class Metrics:
    _lock: threading.Lock = field(default_factory=threading.Lock, repr=False)
    total_tokens: int = 0
    total_workflows: int = 0
    completed_workflows: int = 0
    failed_workflows: int = 0
    tool_calls: int = 0
    llm_calls: int = 0
    rate_limited: int = 0
    start_time: float = field(default_factory=time.time)
    # Cache metrics (DeepSeek prompt caching)
    cache_hit_tokens: int = 0
    cache_miss_tokens: int = 0
    total_prompt_tokens: int = 0
    total_completion_tokens: int = 0

    def record_workflow_completed(self, tokens: int = 0, tool_calls: int = 0) -> None:
        with self._lock:
            self.total_workflows += 1
            self.completed_workflows += 1
            self.total_tokens += tokens
            self.tool_calls += tool_calls

    def record_workflow_failed(self) -> None:
        with self._lock:
            self.total_workflows += 1
            self.failed_workflows += 1

    def record_llm_call(self) -> None:
        with self._lock:
            self.llm_calls += 1

    def record_llm_usage(
        self,
        prompt_tokens: int = 0,
        completion_tokens: int = 0,
        cache_hit_tokens: int = 0,
        cache_miss_tokens: int = 0,
    ) -> None:
        """Record per-call token usage including cache hit/miss from DeepSeek."""
        with self._lock:
            self.total_prompt_tokens += prompt_tokens
            self.total_completion_tokens += completion_tokens
            self.total_tokens += prompt_tokens + completion_tokens
            self.cache_hit_tokens += cache_hit_tokens
            self.cache_miss_tokens += cache_miss_tokens

    def record_rate_limited(self) -> None:
        with self._lock:
            self.rate_limited += 1

    def to_dict(self) -> dict:
        with self._lock:
            uptime = int(time.time() - self.start_time)
            total_cache = self.cache_hit_tokens + self.cache_miss_tokens
            cache_hit_rate = (
                round(self.cache_hit_tokens / total_cache * 100, 1) if total_cache > 0 else 0.0
            )
            return {
                "uptime_seconds": uptime,
                "total_tokens": self.total_tokens,
                "total_workflows": self.total_workflows,
                "completed_workflows": self.completed_workflows,
                "failed_workflows": self.failed_workflows,
                "success_rate": f"{self.completed_workflows / max(self.total_workflows, 1) * 100:.1f}%",
                "tool_calls": self.tool_calls,
                "llm_calls": self.llm_calls,
                "rate_limited": self.rate_limited,
                "cache_hit_tokens": self.cache_hit_tokens,
                "cache_miss_tokens": self.cache_miss_tokens,
                "cache_hit_rate_pct": cache_hit_rate,
                "tokens_saved": self.cache_hit_tokens,
            }

Functions¶

record_llm_usage ¶

record_llm_usage(
    prompt_tokens: int = 0,
    completion_tokens: int = 0,
    cache_hit_tokens: int = 0,
    cache_miss_tokens: int = 0,
) -> None

Record per-call token usage including cache hit/miss from DeepSeek.

Source code in core/metrics.py

def record_llm_usage(
    self,
    prompt_tokens: int = 0,
    completion_tokens: int = 0,
    cache_hit_tokens: int = 0,
    cache_miss_tokens: int = 0,
) -> None:
    """Record per-call token usage including cache hit/miss from DeepSeek."""
    with self._lock:
        self.total_prompt_tokens += prompt_tokens
        self.total_completion_tokens += completion_tokens
        self.total_tokens += prompt_tokens + completion_tokens
        self.cache_hit_tokens += cache_hit_tokens
        self.cache_miss_tokens += cache_miss_tokens

ToolMetrics `dataclass` ¶

Métricas por herramienta: éxito/fallo y latencia.

Source code in core/metrics.py

@dataclass
class ToolMetrics:
    """Métricas por herramienta: éxito/fallo y latencia."""

    _lock: threading.Lock = field(default_factory=threading.Lock, repr=False)
    _calls: dict[str, dict] = field(default_factory=dict)

    def record_call(self, tool_name: str, success: bool, latency_ms: float) -> None:
        """Registra una llamada a herramienta con su resultado y latencia."""
        with self._lock:
            if tool_name not in self._calls:
                self._calls[tool_name] = {
                    "total": 0,
                    "success": 0,
                    "failure": 0,
                    "latency_ms_total": 0.0,
                    "latency_ms_max": 0.0,
                }
            entry = self._calls[tool_name]
            entry["total"] += 1
            entry["latency_ms_total"] += latency_ms
            entry["latency_ms_max"] = max(entry["latency_ms_max"], latency_ms)
            if success:
                entry["success"] += 1
            else:
                entry["failure"] += 1

    def get_tool_stats(self, tool_name: str) -> dict | None:
        """Devuelve las métricas de una herramienta o None."""
        with self._lock:
            entry = self._calls.get(tool_name)
            if entry is None:
                return None
            return self._format_entry(tool_name, entry)

    def get_all_stats(self) -> dict[str, dict]:
        """Devuelve métricas de todas las herramientas."""
        with self._lock:
            return {name: self._format_entry(name, e) for name, e in self._calls.items()}

    def get_summary(self) -> dict:
        """Resumen agregado de todas las herramientas."""
        with self._lock:
            total = sum(e["total"] for e in self._calls.values())
            success = sum(e["success"] for e in self._calls.values())
            failure = sum(e["failure"] for e in self._calls.values())
            return {
                "total_calls": total,
                "success": success,
                "failure": failure,
                "success_rate_pct": round(success / max(total, 1) * 100, 1),
                "tools_tracked": len(self._calls),
            }

    def to_dict(self) -> dict:
        """Métricas completas serializables."""
        return {
            "summary": self.get_summary(),
            "tools": self.get_all_stats(),
        }

    @staticmethod
    def _format_entry(name: str, entry: dict) -> dict:
        total = max(entry["total"], 1)
        return {
            "tool": name,
            "calls": entry["total"],
            "success": entry["success"],
            "failure": entry["failure"],
            "success_rate_pct": round(entry["success"] / total * 100, 1),
            "avg_latency_ms": round(entry["latency_ms_total"] / total, 1),
            "max_latency_ms": round(entry["latency_ms_max"], 1),
        }

Functions¶

record_call ¶

record_call(
    tool_name: str, success: bool, latency_ms: float
) -> None

Registra una llamada a herramienta con su resultado y latencia.

Source code in core/metrics.py

def record_call(self, tool_name: str, success: bool, latency_ms: float) -> None:
    """Registra una llamada a herramienta con su resultado y latencia."""
    with self._lock:
        if tool_name not in self._calls:
            self._calls[tool_name] = {
                "total": 0,
                "success": 0,
                "failure": 0,
                "latency_ms_total": 0.0,
                "latency_ms_max": 0.0,
            }
        entry = self._calls[tool_name]
        entry["total"] += 1
        entry["latency_ms_total"] += latency_ms
        entry["latency_ms_max"] = max(entry["latency_ms_max"], latency_ms)
        if success:
            entry["success"] += 1
        else:
            entry["failure"] += 1

get_tool_stats ¶

get_tool_stats(tool_name: str) -> dict | None

Devuelve las métricas de una herramienta o None.

Source code in core/metrics.py

def get_tool_stats(self, tool_name: str) -> dict | None:
    """Devuelve las métricas de una herramienta o None."""
    with self._lock:
        entry = self._calls.get(tool_name)
        if entry is None:
            return None
        return self._format_entry(tool_name, entry)

get_all_stats ¶

get_all_stats() -> dict[str, dict]

Devuelve métricas de todas las herramientas.

Source code in core/metrics.py

def get_all_stats(self) -> dict[str, dict]:
    """Devuelve métricas de todas las herramientas."""
    with self._lock:
        return {name: self._format_entry(name, e) for name, e in self._calls.items()}

get_summary ¶

get_summary() -> dict

Resumen agregado de todas las herramientas.

Source code in core/metrics.py

def get_summary(self) -> dict:
    """Resumen agregado de todas las herramientas."""
    with self._lock:
        total = sum(e["total"] for e in self._calls.values())
        success = sum(e["success"] for e in self._calls.values())
        failure = sum(e["failure"] for e in self._calls.values())
        return {
            "total_calls": total,
            "success": success,
            "failure": failure,
            "success_rate_pct": round(success / max(total, 1) * 100, 1),
            "tools_tracked": len(self._calls),
        }

to_dict ¶

to_dict() -> dict

Métricas completas serializables.

Source code in core/metrics.py

def to_dict(self) -> dict:
    """Métricas completas serializables."""
    return {
        "summary": self.get_summary(),
        "tools": self.get_all_stats(),
    }

core.models ¶

core.utils ¶

Utilidades generales de Morphix

Functions¶

clean_llm_response ¶

clean_llm_response(response: Any) -> str

Limpieza ULTRA-agresiva de respuestas del LLM. Versión canónica — fusiona la detección de coroutine (memory/manager.py) y el regex eval_count (workflow_utils.py).

Source code in core/utils.py

def clean_llm_response(response: Any) -> str:
    """Limpieza ULTRA-agresiva de respuestas del LLM.
    Versión canónica — fusiona la detección de coroutine (memory/manager.py)
    y el regex eval_count (workflow_utils.py)."""
    if hasattr(response, "__await__"):
        logger.error("⚠️ Se detectó un coroutine sin await en clean_llm_response")
        return "[ERROR INTERNO: llamada async sin await]"

    try:
        if hasattr(response, "choices") and response.choices:
            content = response.choices[0].message.content.strip()
        elif hasattr(response, "message") and hasattr(response.message, "content"):
            content = response.message.content.strip()
        else:
            content = str(response)

        content = re.sub(r"model=.*?(?=content=)", "", content, flags=re.DOTALL | re.IGNORECASE)
        content = re.sub(r"created_at=.*?(?=\n|$)", "", content, flags=re.DOTALL)
        content = re.sub(r"thinking=.*?(?=\n|$)", "", content, flags=re.DOTALL)
        content = re.sub(r"total_duration=.*?(?=\n|$)", "", content, flags=re.DOTALL)
        content = re.sub(r"eval_count=.*?(?=\n|$)", "", content, flags=re.DOTALL)

        match = re.search(r"content='([\s\S]*?)'", content)
        if match:
            content = match.group(1).strip()

        return content.strip()
    except (AttributeError, TypeError, KeyError):
        return str(response)[:800]

core.workspaces ¶

Classes¶

Workspaces ¶

Source code in core/workspaces.py

class Workspaces:
    def __init__(self):
        self.current = "main"
        self._switch_lock = asyncio.Lock()

    async def list_workspaces(self) -> list[str]:
        try:
            return await list_schemas()
        except Exception as e:
            logger.exception("Error listing schemas")
            return []

    async def switch_workspace(self, name: str, retries: int = 1) -> bool:
        if not name or not name.strip():
            logger.error("Empty workspace name, using 'main'")
            name = "main"
        name = self._validate_workspace_name(name)

        async with self._switch_lock:
            return await self._do_switch_workspace(name, retries)

    async def _do_switch_workspace(self, name: str, retries: int) -> bool:

        while retries >= 0:
            if retries == 0 and name != "main":
                name = "main"
            try:
                await create_schema(name)
                await create_tables_in_schema(name)
                await set_async_schema(name)

                await memory.switch_workspace(name)

                from agents.loader import load_workspace_agents, unload_workspace_agents
                from core.path_resolver import paths

                # Copy agent and workflow templates if workspace is new
                agents_dir = paths.workspace_agents_dir(name)
                templates_agents_dir = paths.templates_agents_dir()
                if not agents_dir.exists() or not any(agents_dir.iterdir()):
                    self._bootstrap_workspace_agents(agents_dir, templates_agents_dir)

                workflows_dir = paths.workspace_workflows_dir(name)
                templates_wf_dir = paths.templates_workflows_dir()
                if not workflows_dir.exists() or not any(workflows_dir.iterdir()):
                    self._bootstrap_workspace_workflows(workflows_dir, templates_wf_dir)

                hooks_dir = paths.workspace_hooks_dir(name)
                templates_hooks_dir = paths.templates_hooks_dir()
                if not hooks_dir.exists() or not any(hooks_dir.iterdir()):
                    self._bootstrap_workspace_hooks(hooks_dir, templates_hooks_dir)

                unload_workspace_agents()
                load_workspace_agents(name)

                from tools.loader import load_workspace_tools, unload_workspace_tools

                unload_workspace_tools()
                load_workspace_tools(name)

                from core.hook_loader import load_workspace_hooks, unload_workspace_hooks

                unload_workspace_hooks()
                load_workspace_hooks(name)

                from core.mcp.client import connect_mcp_servers, disconnect_mcp_servers

                await disconnect_mcp_servers()
                await connect_mcp_servers(name)

                self.current = name
                switch_workflow_state(name)

                logger.info(f"Switched to {name}")
                return True
            except Exception as e:
                retries -= 1
                if name != "main":
                    logger.warning(f"Fallback a 'main' desde '{name}': {e}")
                    name = "main"
                    retries = max(retries, 0)
                else:
                    logger.critical(f"switch_workspace('main') falló: {e}", exc_info=True)
                    return False

        return False

    async def create_workspace(self, name: str) -> bool:
        """Crea el workspace (si no existe) y cambia a él."""
        return await self.switch_workspace(name)

    async def delete_workspace(self, name: str) -> bool:
        name = self._validate_workspace_name(name)
        if name == self.current:
            await self.switch_workspace("main")
        try:
            await drop_schema(name)
            logger.info(f"Deleted {name}")
            return True
        except Exception as e:
            logger.error(f"Delete error: {e}")
            return False

    @staticmethod
    def _validate_workspace_name(name: str) -> str:
        import re

        if not re.match(r"^[a-z][a-z0-9_]*$", name):
            raise ValueError(
                f"Nombre de workspace inválido: '{name}'. "
                "Solo se permiten minúsculas, números y guiones bajos, empezando con letra."
            )
        return name

    @staticmethod
    def _bootstrap_workspace_agents(agents_dir, templates_dir):
        """Copia los templates de agentes a un workspace nuevo."""
        import shutil

        if not templates_dir.exists():
            logger.info("No hay templates de agentes disponibles")
            return

        agents_dir.mkdir(parents=True, exist_ok=True)
        copied = 0
        for template_file in templates_dir.glob("*.yaml"):
            dest = agents_dir / template_file.name
            if not dest.exists():
                shutil.copy2(template_file, dest)
                copied += 1

        if copied:
            logger.info(f"Bootstrap: {copied} agentes copiados a {agents_dir}")
        else:
            logger.info(f"Agentes ya existen en {agents_dir}, sin cambios")

    @staticmethod
    def _bootstrap_workspace_workflows(workflows_dir, templates_dir):
        """Copia los templates de workflows a un workspace nuevo."""
        import shutil

        if not templates_dir.exists():
            logger.info("No hay templates de workflows disponibles")
            return

        workflows_dir.mkdir(parents=True, exist_ok=True)
        copied = 0
        for template_file in templates_dir.glob("*.yaml"):
            dest = workflows_dir / template_file.name
            if not dest.exists():
                shutil.copy2(template_file, dest)
                copied += 1

        if copied:
            logger.info(f"Bootstrap: {copied} workflows copiados a {workflows_dir}")
        else:
            logger.info(f"Workflows ya existen en {workflows_dir}, sin cambios")

    @staticmethod
    def _bootstrap_workspace_hooks(hooks_dir, templates_dir):
        """Copia los templates de hooks a un workspace nuevo."""
        import shutil

        if not templates_dir.exists():
            logger.info("No hay templates de hooks disponibles")
            return

        hooks_dir.mkdir(parents=True, exist_ok=True)
        copied = 0
        for template_file in templates_dir.glob("*.py"):
            dest = hooks_dir / template_file.name
            if not dest.exists():
                shutil.copy2(template_file, dest)
                copied += 1

        if copied:
            logger.info(f"Bootstrap: {copied} hooks copiados a {hooks_dir}")
        else:
            logger.info(f"Hooks ya existen en {hooks_dir}, sin cambios")

Functions¶

create_workspace `async` ¶

create_workspace(name: str) -> bool

Crea el workspace (si no existe) y cambia a él.

Source code in core/workspaces.py

async def create_workspace(self, name: str) -> bool:
    """Crea el workspace (si no existe) y cambia a él."""
    return await self.switch_workspace(name)

Functions¶

core.workflow_state ¶

Tracks the active workflow per workspace (remembers last selection in each).

Functions¶

set_active_workflow ¶

set_active_workflow(name: str) -> None

Set the active workflow for the current workspace.

Source code in core/workflow_state.py

def set_active_workflow(name: str) -> None:
    """Set the active workflow for the current workspace."""
    with _lock:
        _workflow_map[_current_workspace] = name

get_active_workflow ¶

get_active_workflow() -> str

Get the active workflow for the current workspace.

Source code in core/workflow_state.py

def get_active_workflow() -> str:
    """Get the active workflow for the current workspace."""
    with _lock:
        default = settings.default_workflow or "default"
        return _workflow_map.get(_current_workspace, default)

switch_workspace ¶

switch_workspace(workspace: str) -> None

Update current workspace without losing saved preferences.

Source code in core/workflow_state.py

def switch_workspace(workspace: str) -> None:
    """Update current workspace without losing saved preferences."""
    global _current_workspace
    with _lock:
        _current_workspace = workspace

core.memory.manager ¶

MemoryManager - Sistema de 3 Capas Self-Healing (VERSIÓN FINAL ROBUSTA Y ESTABLE) Aislamiento por workspace: subdirectorios memory/{workspace}/

Classes¶

MemoryManager ¶

Source code in core/memory/manager.py

class MemoryManager:
    _PROTECTED_EXACT: set[str] = {
        "kairos_daemon_heartbeat",
        "user_profile",
        "user_profile_last_update",
        "security_private",
        "last_creative_output",
        "last_analysis",
        "last_plan",
        "last_connection",
        "last_successful_code",
    }
    _PROTECTED_PREFIXES: tuple[str, ...] = ("workflow_subtask_", "last_", "merged_")

    _instance = None
    _lock = threading.RLock()

    def __new__(cls):
        if cls._instance is None:
            with cls._lock:
                if cls._instance is None:
                    cls._instance = super().__new__(cls)
                    cls._instance._init_memory()
        return cls._instance

    def _init_memory(self):
        from core.path_resolver import paths

        self.base_dir = paths.memory_base()
        self.base_dir.mkdir(parents=True, exist_ok=True)
        self.active_workspace = None
        self.documents: list[tuple[str, Any]] = []
        self.index = faiss.IndexFlatL2(FAISS_DIMENSION)
        self.embedder = EmbeddingProvider  # lazy — carga en background
        self._access_log: dict[str, float] = {}  # key -> last access timestamp
        logger.info("✅ Memoria 3-capas inicializada (embeddings en carga lazy)")

    def _embed(self, text: str):
        """Wrapper que espera al modelo si aún no está listo."""
        if not self.embedder.wait_until_ready(timeout=60):
            logger.warning("Modelo de embeddings no disponible tras timeout")
            return None
        return self.embedder.encode(text)

    # ==================== HELPERS ====================
    def get_user_summary(self) -> str:
        profile = self.get_user_profile()
        if not profile or not any(profile.values()):
            return ""
        lines = [
            f"- {k.replace('_', ' ').title()}: {v}"
            for k, v in profile.items()
            if v and k != "preferences"
        ]
        return "\n".join(lines)

    def get_long_context_summary(self, history: list, max_facts: int = 8) -> str:
        if len(history) <= 10:
            return ""
        facts = []
        for msg in history[:-10]:
            content = msg.get("content", "").strip()
            if content and len(content) > 15:
                facts.append(content[:250])
        if not facts:
            return ""
        return "\n".join(f"- {f}" for f in facts[:max_facts])

    async def save_user_correction(self, original_task: str, correction: str) -> bool:
        key = f"correction_{hash(original_task) % 100000}"
        value = {
            "original": original_task[:300],
            "correction": correction[:800],
            "timestamp": int(time.time()),
        }
        return await self.write(key, value, validated=True, content_hint="analytical")

    # ==================== CAMBIO DE WORKSPACE ====================
    async def switch_workspace(self, workspace: str):
        """Switch to the given workspace, loading its documents and index.
        Embedding computation runs in a thread pool to avoid blocking the event loop."""
        with self._lock:
            if self.active_workspace == workspace:
                return

            old_ws = self.active_workspace
            old_docs = self.documents
            old_index = self.index

            try:
                ws_dir = self.base_dir / workspace
                ws_dir.mkdir(parents=True, exist_ok=True)

                # Read files under lock (fast I/O)
                file_entries: list[tuple[str, Any]] = []
                for file in ws_dir.glob("*.md"):
                    with open(file, encoding="utf-8") as f:
                        content = f.read().strip()
                    key = file.stem
                    val = json.loads(content) if content.startswith("{") else content
                    file_entries.append((key, val))
            except Exception as e:
                logger.warning("Unhandled exception in MemoryManager", exc_info=True)
                self.active_workspace = old_ws
                self.documents = old_docs
                self.index = old_index
                raise RuntimeError(f"Error switching to workspace '{workspace}': {e}")

        # Compute embeddings in thread pool (slow operation, non-blocking for async)
        def _build_index():
            new_index = faiss.IndexFlatL2(FAISS_DIMENSION)
            new_docs = []
            for key, val in file_entries:
                try:
                    emb = self._embed(str(val))
                    new_index.add(emb.reshape(1, -1))
                    new_docs.append((key, val))
                except Exception:
                    logger.warning("Error generating embedding for '%s', skipping", key)
            return new_index, new_docs

        new_index, new_docs = await asyncio.to_thread(_build_index)

        # Atomic swap of index and documents under lock
        with self._lock:
            self.active_workspace = workspace
            self.documents = new_docs
            self.index = new_index
            logger.info(f"🔄 Workspace switched to '{workspace}' ({len(new_docs)} documents)")

    # ==================== ESCRITURA EN SYSTEM (global) ====================
    async def write_system(self, key: str, value: Any) -> bool:
        """Escribe en memory/system/ sin interferir con el índice activo."""
        sys_dir = self.base_dir / "system"
        sys_dir.mkdir(exist_ok=True)
        file = sys_dir / f"{key}.md"
        with self._lock:
            try:
                with open(file, "w", encoding="utf-8") as f:
                    if isinstance(value, (dict, list)):
                        json.dump(value, f, indent=2, ensure_ascii=False)
                    else:
                        f.write(str(value))
                return True
            except Exception as e:
                logger.error(f"Error escribiendo en system/{key}: {e}")
                return False

    # ==================== ROBUST WRITE WITH ROLLBACK (FIXED) ====================
    async def write(
        self, key: str, value: Any, validated: bool = False, content_hint: str | None = None
    ) -> bool:
        if self.active_workspace is None:
            logger.error("No hay workspace activo. No se puede escribir en memoria.")
            return False

        score: int | str = "N/A"

        if not validated:
            critique = await self._llm_critique(key, value, content_hint)
            score = int(critique.get("quality_score", 0))  # type: ignore[no-redef]
            threshold: int = self._get_quality_threshold(content_hint, key)

            if score < threshold:
                logger.warning(f"❌ Write RECHAZADO: {key} (score: {score} < {threshold})")
                return False

            if critique.get("suggested_fix"):
                value = critique["suggested_fix"]
                logger.info(f"🔧 Auto-corrección aplicada a: {key}")

        # Pre-compute embedding OUTSIDE the lock to avoid blocking other
        # memory operations while the model generates the vector.
        embedding = self._embed(str(value))
        if embedding is None:
            logger.error(f"❌ Embedding no disponible para '{key}'")
            return False

        with self._lock:
            old_entry = next(((k, v) for k, v in self.documents if k == key), None)
            self.documents = [doc for doc in self.documents if doc[0] != key]

            ws_dir = self.base_dir / self.active_workspace
            ws_dir.mkdir(parents=True, exist_ok=True)
            file = ws_dir / f"{key}.md"
            file_created = False

            try:
                with open(file, "w", encoding="utf-8") as f:
                    if isinstance(value, (dict, list)):
                        f.write(json.dumps(value, indent=2, ensure_ascii=False))
                    else:
                        f.write(str(value))
                file_created = True

                self.index.add(embedding.reshape(1, -1))
                self.documents.append((key, value))
                self._access_log[key] = time.time()
            except Exception as e:
                logger.error(f"Error saving '{key}': {e}")
                # Always restore the previous entry
                if old_entry is not None:
                    self.documents.append(old_entry)
                    # Also restore the previous file content
                    try:
                        with open(file, "w", encoding="utf-8") as f:
                            old_val = old_entry[1]
                            if isinstance(old_val, (dict, list)):
                                json.dump(old_val, f, indent=2, ensure_ascii=False)
                            else:
                                f.write(str(old_val))
                    except Exception:
                        logger.debug("Rollback de archivo fallido en restauración", exc_info=True)
                    logger.info(f"↩️ Rollback completado para '{key}'")
                elif file_created and file.exists():
                    file.unlink()
                return False

        logger.info(f"✅ Memoria escrita: {key} (score: {score})")
        return True

    def _get_quality_threshold(self, content_hint: str | None, key: str) -> int:
        if key == "user_profile_last_update":
            return 15
        if key.startswith("workflow_subtask_"):
            return 20
        if content_hint == "creative":
            return 30
        if content_hint == "analytical":
            return 50
        return 40

    # ==================== LLM CRITIQUE ====================
    async def _llm_critique(self, key: str, value: Any, content_hint: str | None = None) -> dict:
        if not value or len(str(value).strip()) < 10:
            return {
                "quality_score": 0,
                "is_valid": False,
                "suggested_fix": "",
                "reason": "Contenido demasiado corto",
            }

        prompt = self._build_critique_prompt(key, value, content_hint)

        try:
            response = await models.call(
                messages=[{"role": "user", "content": prompt}],
                role="critique",
                temperature=0.0,
            )
            raw = clean_llm_response(response)
            data = self._parse_critique_response(raw)

            if not data:
                logger.warning(
                    f"⚠️ Parseo de crítica vacío para '{key}', usando valores por defecto"
                )
                data = {}

            return {
                "quality_score": int(float(data.get("quality_score", 50))),
                "is_valid": bool(data.get("is_valid", True)),
                "suggested_fix": data.get("suggested_fix", ""),
                "reason": data.get("reason", ""),
            }
        except Exception as e:
            logger.warning(f"Critique falló para '{key}': {e}")
            return {
                "quality_score": 60,
                "is_valid": True,
                "suggested_fix": "",
                "reason": f"Excepción: {e}",
            }

    def _build_critique_prompt(self, key: str, value: Any, content_hint: str | None = None) -> str:
        safe_value = str(value)[:1000]
        tipo = {
            "creative": "contenido CREATIVO",
            "analytical": "análisis",
        }.get(content_hint or "", "memoria")

        return f"""Evalúa la calidad de este {tipo}. Responde SOLO con JSON válido.
KEY: {key}
VALUE: {safe_value}
{{"quality_score": 0-100, "is_valid": true/false, "suggested_fix": "...", "reason": "..."}}"""

    def _parse_critique_response(self, raw: str) -> dict:
        data = parse_json_from_llm(raw)
        if data:
            return data
        # Fallback regex for individual fields
        data = {}
        score_match = re.search(r'"quality_score"\s*:\s*([\d.]+)', raw)
        if score_match:
            data["quality_score"] = float(score_match.group(1))
        valid_match = re.search(r'"is_valid"\s*:\s*(true|false)', raw, re.IGNORECASE)
        if valid_match:
            data["is_valid"] = valid_match.group(1).lower() == "true"
        return data

    # ==================== SELF-HEALING ====================
    async def _detect_duplicates(self) -> int:
        """Find and merge near-duplicate documents (FAISS similarity > 0.92).

        Returns number of duplicates removed.
        """
        removed = 0
        with self._lock:
            docs = list(self.documents)

        if len(docs) < 2:
            return 0

        seen: set[int] = set()
        for i, (key_a, val_a) in enumerate(docs):
            if i in seen:
                continue
            if key_a in self._PROTECTED_EXACT or any(
                key_a.startswith(p) for p in self._PROTECTED_PREFIXES
            ):
                continue
            try:
                emb_a = self._embed(str(val_a))
                if emb_a is None:
                    continue
                distances, indices = self.index.search(
                    emb_a.reshape(1, -1), min(5, self.index.ntotal)
                )
            except Exception:
                logger.warning(
                    "Unhandled exception in MemoryManager._detect_duplicates", exc_info=True
                )
                continue

            for dist, idx in zip(distances[0], indices[0], strict=False):
                if idx < 0 or idx >= len(docs) or idx == i or idx in seen:
                    continue
                similarity = 1.0 / (1.0 + float(dist))
                if similarity > 0.92:
                    key_b, val_b = docs[idx]
                    # Keep the document with higher quality score
                    crit_a = await self._llm_critique(key_a, val_a)
                    crit_b = await self._llm_critique(key_b, val_b)
                    score_a = crit_a.get("quality_score", 0)
                    score_b = crit_b.get("quality_score", 0)

                    if score_a >= score_b:
                        to_remove = (idx, key_b)
                        logger.info(
                            f"Duplicate merged: '{key_b}' → '{key_a}' (sim={similarity:.3f})"
                        )
                    else:
                        to_remove = (i, key_a)
                        logger.info(
                            f"Duplicate merged: '{key_a}' → '{key_b}' (sim={similarity:.3f})"
                        )

                    seen.add(to_remove[0])
                    with self._lock:
                        ws_dir = self.base_dir / self.active_workspace
                        file = ws_dir / f"{to_remove[1]}.md"
                        if file.exists():
                            file.unlink()
                        self.documents = [d for d in self.documents if d[0] != to_remove[1]]
                        self._access_log.pop(to_remove[1], None)
                    removed += 1
                    break  # Only remove one duplicate per source document

        if removed > 0:
            await self._rebuild_index()
        return removed

    async def _resolve_contradictions(self) -> int:
        """Detect contradictory document pairs and ask LLM to resolve.

        Returns number of contradictions resolved.
        """
        resolved = 0
        with self._lock:
            docs = list(self.documents)

        if len(docs) < 2:
            return 0

        # Find similar-but-not-identical pairs (similarity 0.65-0.92)
        checked: set[tuple[int, int]] = set()
        for i, (key_a, val_a) in enumerate(docs):
            if key_a in self._PROTECTED_EXACT or any(
                key_a.startswith(p) for p in self._PROTECTED_PREFIXES
            ):
                continue
            try:
                emb_a = self._embed(str(val_a))
                if emb_a is None:
                    continue
                distances, indices = self.index.search(
                    emb_a.reshape(1, -1), min(3, self.index.ntotal)
                )
            except Exception:
                logger.warning(
                    "Unhandled exception in MemoryManager._resolve_contradictions", exc_info=True
                )
                continue

            for dist, idx in zip(distances[0], indices[0], strict=False):
                if idx < 0 or idx >= len(docs) or idx == i:
                    continue
                pair = tuple(sorted([i, idx]))
                if pair in checked:
                    continue
                checked.add(pair)

                similarity = 1.0 / (1.0 + float(dist))
                if not (0.65 <= similarity <= 0.92):
                    continue

                key_b, val_b = docs[idx]
                resolution = await self._arbitrate_contradiction(key_a, val_a, key_b, val_b)
                if resolution is None:
                    continue

                resolved += 1
                # Write merged resolution, remove original pair
                await self.write(
                    f"merged_{key_a}_{key_b}"[:80],
                    resolution,
                    validated=True,
                )
                with self._lock:
                    ws_dir = self.base_dir / self.active_workspace
                    for rm_key in (key_a, key_b):
                        file = ws_dir / f"{rm_key}.md"
                        if file.exists():
                            file.unlink()
                        self.documents = [d for d in self.documents if d[0] != rm_key]
                        self._access_log.pop(rm_key, None)

        if resolved > 0:
            await self._rebuild_index()
        return resolved

    async def _arbitrate_contradiction(
        self, key_a: str, val_a: Any, key_b: str, val_b: Any
    ) -> str | None:
        """Ask LLM to reconcile two potentially contradictory facts."""
        prompt = (
            "You are a memory consolidation system. Two stored facts may contradict.\n"
            f"Fact A ({key_a}): {str(val_a)[:500]}\n"
            f"Fact B ({key_b}): {str(val_b)[:500]}\n\n"
            "If they DON'T contradict, reply with the single word: SKIP\n"
            "If they DO contradict or overlap, produce a SINGLE consolidated fact "
            "that resolves the conflict. Keep the consolidated fact under 300 characters. "
            "Reply with just the consolidated text, no quotes, no JSON."
        )
        try:
            response = await models.call(
                messages=[{"role": "user", "content": prompt}],
                role="critique",
                temperature=0.0,
            )
            text = clean_llm_response(response).strip()
            if text.upper().startswith("SKIP"):
                return None
            if len(text) > 10:
                logger.info(f"Contradiction resolved: '{key_a}' + '{key_b}' → merged")
                return text
        except Exception as e:
            logger.warning(f"Contradiction arbitration failed: {e}")
        return None

    async def _prune_stale(self, max_age_days: int = 30) -> int:
        """Remove documents not accessed in max_age_days (skipping protected keys)."""
        threshold = time.time() - (max_age_days * 86400)
        removed = 0

        with self._lock:
            stale_keys = []
            for key, _val in self.documents:
                if key in self._PROTECTED_EXACT or any(
                    key.startswith(p) for p in self._PROTECTED_PREFIXES
                ):
                    continue
                last_access = self._access_log.get(key, 0)
                if last_access < threshold:
                    stale_keys.append(key)

            if stale_keys:
                ws_dir = self.base_dir / self.active_workspace
                for key in stale_keys:
                    file = ws_dir / f"{key}.md"
                    if file.exists():
                        file.unlink()
                    self._access_log.pop(key, None)
                    logger.info(f"Pruned stale document: {key}")
                self.documents = [d for d in self.documents if d[0] not in stale_keys]
                removed = len(stale_keys)

        if removed > 0:
            await self._rebuild_index()
        return removed

    async def _rebuild_index(self) -> None:
        """Rebuild FAISS index from current documents (called after batch modifications)."""
        with self._lock:
            doc_snapshot = list(self.documents)

        precomputed: list = []
        for _, val in doc_snapshot:
            try:
                emb = self._embed(str(val))
                if emb is not None:
                    precomputed.append(emb)
            except Exception as e:
                logger.warning(f"Error generating embedding during index rebuild: {e}")

        with self._lock:
            self.index = faiss.IndexFlatL2(FAISS_DIMENSION)
            for emb in precomputed:
                self.index.add(emb.reshape(1, -1))
            logger.debug(f"FAISS index rebuilt: {self.index.ntotal} vectors")

    async def self_healing_check(self):
        if self.active_workspace is None:
            logger.info("Self-healing cancelado: sin workspace activo")
            return

        logger.info(f"🔧 Iniciando self-healing en workspace '{self.active_workspace}'...")

        with self._lock:
            documents_to_check = list(self.documents)[-20:]

        low_quality = []
        for key, value in documents_to_check:
            if key in self._PROTECTED_EXACT or any(
                key.startswith(p) for p in self._PROTECTED_PREFIXES
            ):
                continue
            critique = await self._llm_critique(key, value)
            if critique.get("quality_score", 0) < 60:
                low_quality.append((key, critique))
                logger.warning(
                    f"📉 Baja calidad detectada: {key} (score: {critique.get('quality_score')})"
                )

        for key, critique in low_quality:
            if critique.get("suggested_fix"):
                logger.info(f"🔧 Aplicando auto-corrección a {key}")
                await self.write(key, critique["suggested_fix"], validated=True)
            else:
                with self._lock:
                    ws_dir = self.base_dir / self.active_workspace
                    file = ws_dir / f"{key}.md"
                    if file.exists():
                        file.unlink()
                    self.documents = [doc for doc in self.documents if doc[0] != key]
                    self._access_log.pop(key, None)
                    logger.warning(f"🗑️ Eliminado por baja calidad: {key}")

        # Phase 2: Duplicate detection via FAISS similarity
        dup_count = await self._detect_duplicates()

        # Phase 3: Contradiction resolution via LLM arbitration
        contra_count = await self._resolve_contradictions()

        # Phase 4: Prune stale documents (30+ days unaccessed)
        pruned_count = await self._prune_stale(max_age_days=30)

        # Atomic index rebuild: take snapshot under lock,
        # precompute embeddings outside the lock, then rebuild
        # the index inside the lock with the precomputed embeddings.
        with self._lock:
            doc_snapshot = list(self.documents)

        # Precalcular embeddings FUERA del lock
        precomputed: list = []
        for _, val in doc_snapshot:
            try:
                emb = self._embed(str(val))
                if emb is not None:
                    precomputed.append(emb)
            except Exception as e:
                logger.warning(f"Error generando embedding durante self-healing: {e}")

        # Rebuild index inside the lock
        with self._lock:
            self.index = faiss.IndexFlatL2(FAISS_DIMENSION)
            for emb in precomputed:
                self.index.add(emb.reshape(1, -1))

        logger.info(
            f"✅ Self-healing completado en workspace '{self.active_workspace}' | "
            f"Revisados: {len(documents_to_check)} | Baja calidad: {len(low_quality)} | "
            f"Duplicados: {dup_count} | Contradicciones: {contra_count} | Poda: {pruned_count}"
        )

    # ==================== PUBLIC METHODS ====================
    def search(self, query: str, k: int = 5, min_similarity: float = 0.0) -> list[dict]:
        """Búsqueda semántica real usando FAISS. Retorna top-k documentos con scores."""
        query_emb = self._embed(query)
        if query_emb is None:
            return []
        with self._lock:
            if self.index is None or self.index.ntotal == 0:
                return []
            try:
                distances, indices = self.index.search(
                    query_emb.reshape(1, -1), min(k, self.index.ntotal)
                )
                results = []
                for dist, idx in zip(distances[0], indices[0], strict=False):
                    if idx < 0 or idx >= len(self.documents):
                        continue
                    if dist > min_similarity * 100 and min_similarity > 0:
                        continue
                    key, val = self.documents[idx]
                    self._access_log[key] = time.time()
                    results.append(
                        {
                            "key": key,
                            "value": val,
                            "distance": float(dist),
                            "similarity": round(1.0 / (1.0 + float(dist)), 4),
                        }
                    )
                return results
            except Exception as e:
                logger.error(f"Error en búsqueda semántica: {e}")
                return []

    def read(self, key: str) -> Any:
        with self._lock:
            for k, v in self.documents:
                if k == key:
                    self._access_log[key] = time.time()
                    return v
            return None

    def get_user_profile(self) -> dict:
        profile = self.read("user_profile")
        return (
            profile
            if isinstance(profile, dict)
            else {"name": None, "country": None, "preferences": {}}
        )

    async def update_user_profile(self, new_data: dict) -> bool:
        if not new_data:
            return False
        current = self.get_user_profile()
        updated = {**current, **new_data}
        return await self.write("user_profile", updated, validated=True)

Functions¶

switch_workspace `async` ¶

switch_workspace(workspace: str)

Switch to the given workspace, loading its documents and index. Embedding computation runs in a thread pool to avoid blocking the event loop.

Source code in core/memory/manager.py

async def switch_workspace(self, workspace: str):
    """Switch to the given workspace, loading its documents and index.
    Embedding computation runs in a thread pool to avoid blocking the event loop."""
    with self._lock:
        if self.active_workspace == workspace:
            return

        old_ws = self.active_workspace
        old_docs = self.documents
        old_index = self.index

        try:
            ws_dir = self.base_dir / workspace
            ws_dir.mkdir(parents=True, exist_ok=True)

            # Read files under lock (fast I/O)
            file_entries: list[tuple[str, Any]] = []
            for file in ws_dir.glob("*.md"):
                with open(file, encoding="utf-8") as f:
                    content = f.read().strip()
                key = file.stem
                val = json.loads(content) if content.startswith("{") else content
                file_entries.append((key, val))
        except Exception as e:
            logger.warning("Unhandled exception in MemoryManager", exc_info=True)
            self.active_workspace = old_ws
            self.documents = old_docs
            self.index = old_index
            raise RuntimeError(f"Error switching to workspace '{workspace}': {e}")

    # Compute embeddings in thread pool (slow operation, non-blocking for async)
    def _build_index():
        new_index = faiss.IndexFlatL2(FAISS_DIMENSION)
        new_docs = []
        for key, val in file_entries:
            try:
                emb = self._embed(str(val))
                new_index.add(emb.reshape(1, -1))
                new_docs.append((key, val))
            except Exception:
                logger.warning("Error generating embedding for '%s', skipping", key)
        return new_index, new_docs

    new_index, new_docs = await asyncio.to_thread(_build_index)

    # Atomic swap of index and documents under lock
    with self._lock:
        self.active_workspace = workspace
        self.documents = new_docs
        self.index = new_index
        logger.info(f"🔄 Workspace switched to '{workspace}' ({len(new_docs)} documents)")

write_system `async` ¶

write_system(key: str, value: Any) -> bool

Escribe en memory/system/ sin interferir con el índice activo.

Source code in core/memory/manager.py

async def write_system(self, key: str, value: Any) -> bool:
    """Escribe en memory/system/ sin interferir con el índice activo."""
    sys_dir = self.base_dir / "system"
    sys_dir.mkdir(exist_ok=True)
    file = sys_dir / f"{key}.md"
    with self._lock:
        try:
            with open(file, "w", encoding="utf-8") as f:
                if isinstance(value, (dict, list)):
                    json.dump(value, f, indent=2, ensure_ascii=False)
                else:
                    f.write(str(value))
            return True
        except Exception as e:
            logger.error(f"Error escribiendo en system/{key}: {e}")
            return False

search ¶

search(
    query: str, k: int = 5, min_similarity: float = 0.0
) -> list[dict]

Búsqueda semántica real usando FAISS. Retorna top-k documentos con scores.

Source code in core/memory/manager.py

def search(self, query: str, k: int = 5, min_similarity: float = 0.0) -> list[dict]:
    """Búsqueda semántica real usando FAISS. Retorna top-k documentos con scores."""
    query_emb = self._embed(query)
    if query_emb is None:
        return []
    with self._lock:
        if self.index is None or self.index.ntotal == 0:
            return []
        try:
            distances, indices = self.index.search(
                query_emb.reshape(1, -1), min(k, self.index.ntotal)
            )
            results = []
            for dist, idx in zip(distances[0], indices[0], strict=False):
                if idx < 0 or idx >= len(self.documents):
                    continue
                if dist > min_similarity * 100 and min_similarity > 0:
                    continue
                key, val = self.documents[idx]
                self._access_log[key] = time.time()
                results.append(
                    {
                        "key": key,
                        "value": val,
                        "distance": float(dist),
                        "similarity": round(1.0 / (1.0 + float(dist)), 4),
                    }
                )
            return results
        except Exception as e:
            logger.error(f"Error en búsqueda semántica: {e}")
            return []

Functions¶

core.mcp.server ¶

MCP server — expose Morphix tools over stdio JSON-RPC.

Usage

morphix mcp-server poetry run python -m core.mcp.server

Other MCP clients (opencode, Claude Desktop) can connect and use Morphix tools: file_manager, bash_manager, web_search, etc.

Classes¶

MCPServer ¶

Source code in core/mcp/server.py

class MCPServer:
    def __init__(self):
        self._initialized = False
        self._server_info = {"name": "morphix", "version": "1.0"}

    def _get_tools(self) -> list[dict]:
        """Collect all registered Morphix tools as MCP tool schemas."""
        from tools.specs import TOOL_DEFINITIONS

        tools = []
        for name, tdef in sorted(TOOL_DEFINITIONS.items()):
            tool_dict = {
                "name": name,
                "description": tdef.description,
                "parameters": tdef.parameters,
                "required": tdef.required,
            }
            tools.append(morphix_to_mcp_tool(tool_dict))
        return tools

    async def _handle_initialize(self, msg: dict) -> dict:
        params = msg.get("params", {})
        client_info = params.get("clientInfo", {})
        logger.info(
            f"MCP client connected: {client_info.get('name', 'unknown')} "
            f"v{client_info.get('version', '?')}"
        )
        self._initialized = True
        return {
            "protocolVersion": "2024-11-05",
            "capabilities": {"tools": {}},
            "serverInfo": self._server_info,
        }

    async def _handle_tools_list(self, msg: dict) -> dict:
        tools = self._get_tools()
        return {"tools": tools}

    async def _handle_tools_call(self, msg: dict) -> dict:
        params = msg.get("params", {})
        tool_name = params.get("name", "")
        arguments = params.get("arguments", {})

        if not tool_name:
            return build_error(msg.get("id"), -32602, "Missing tool name")

        from tools.wrapper import safe_tool_call

        try:
            result = await safe_tool_call(tool_name, arguments)
        except Exception as e:
            logger.exception(f"MCP tool '{tool_name}' failed")
            return {
                "content": [{"type": "text", "text": f"Tool error: {e}"}],
                "isError": True,
            }

        if isinstance(result, dict):
            output_text = str(result.get("output", result.get("error", str(result))))
            is_error = not result.get("success", False)
        else:
            output_text = str(result)
            is_error = False

        return {
            "content": [{"type": "text", "text": output_text}],
            "isError": is_error,
        }

    async def run(self) -> None:
        """Main loop: read JSON-RPC from stdin, respond on stdout."""
        reader = asyncio.StreamReader()
        protocol = asyncio.StreamReaderProtocol(reader)
        await asyncio.get_running_loop().connect_read_pipe(lambda: protocol, sys.stdin)

        write_transport, write_protocol = await asyncio.get_running_loop().connect_write_pipe(
            asyncio.streams.FlowControlMixin, sys.stdout.buffer
        )
        writer = asyncio.StreamWriter(
            write_transport, write_protocol, reader, asyncio.get_running_loop()
        )

        logger.info("MCP server ready (stdio)")
        handlers = {
            "initialize": self._handle_initialize,
            "tools/list": self._handle_tools_list,
            "tools/call": self._handle_tools_call,
        }

        try:
            while True:
                msg = await read_message(reader)

                if is_notification(msg):
                    method = msg.get("method", "")
                    if method == "notifications/initialized":
                        logger.info("MCP client initialized notification received")
                    continue

                msg_id = msg.get("id")
                method = msg.get("method", "")

                handler = handlers.get(method)
                if handler is None:
                    await write_message(
                        writer, build_error(msg_id, -32601, f"Method not found: {method}")
                    )
                    continue

                try:
                    result = await handler(msg)
                    if isinstance(result, dict) and "jsonrpc" in result:
                        await write_message(writer, result)
                    else:
                        await write_message(writer, build_response(msg_id or 0, result))
                except Exception as e:
                    logger.exception(f"MCP handler '{method}' error")
                    await write_message(writer, build_error(msg_id, -32603, str(e)))

        except ConnectionError:
            logger.info("MCP client disconnected")
        except asyncio.CancelledError:
            pass

Functions¶

run `async` ¶

run() -> None

Main loop: read JSON-RPC from stdin, respond on stdout.

Source code in core/mcp/server.py

async def run(self) -> None:
    """Main loop: read JSON-RPC from stdin, respond on stdout."""
    reader = asyncio.StreamReader()
    protocol = asyncio.StreamReaderProtocol(reader)
    await asyncio.get_running_loop().connect_read_pipe(lambda: protocol, sys.stdin)

    write_transport, write_protocol = await asyncio.get_running_loop().connect_write_pipe(
        asyncio.streams.FlowControlMixin, sys.stdout.buffer
    )
    writer = asyncio.StreamWriter(
        write_transport, write_protocol, reader, asyncio.get_running_loop()
    )

    logger.info("MCP server ready (stdio)")
    handlers = {
        "initialize": self._handle_initialize,
        "tools/list": self._handle_tools_list,
        "tools/call": self._handle_tools_call,
    }

    try:
        while True:
            msg = await read_message(reader)

            if is_notification(msg):
                method = msg.get("method", "")
                if method == "notifications/initialized":
                    logger.info("MCP client initialized notification received")
                continue

            msg_id = msg.get("id")
            method = msg.get("method", "")

            handler = handlers.get(method)
            if handler is None:
                await write_message(
                    writer, build_error(msg_id, -32601, f"Method not found: {method}")
                )
                continue

            try:
                result = await handler(msg)
                if isinstance(result, dict) and "jsonrpc" in result:
                    await write_message(writer, result)
                else:
                    await write_message(writer, build_response(msg_id or 0, result))
            except Exception as e:
                logger.exception(f"MCP handler '{method}' error")
                await write_message(writer, build_error(msg_id, -32603, str(e)))

    except ConnectionError:
        logger.info("MCP client disconnected")
    except asyncio.CancelledError:
        pass

Functions¶

run_mcp_server ¶

run_mcp_server() -> None

Entry point for 'morphix mcp-server'.

Source code in core/mcp/server.py

def run_mcp_server() -> None:
    """Entry point for 'morphix mcp-server'."""
    logging.basicConfig(
        level=logging.WARNING,
        format="%(asctime)s - %(levelname)s - %(name)s - %(message)s",
        stream=sys.stderr,
    )
    # Load global tools so they're available in the registry
    from tools.loader import load_global_tools

    load_global_tools()

    server = MCPServer()
    asyncio.run(server.run())

core.mcp.client ¶

MCP client — connect to external MCP servers, discover and proxy their tools.

Classes¶

MCPClient ¶

Manages one MCP server connection (subprocess via stdio).

Source code in core/mcp/client.py

class MCPClient:
    """Manages one MCP server connection (subprocess via stdio)."""

    def __init__(self, config: MCPServerConfig):
        self.config = config
        self.process: asyncio.subprocess.Process | None = None
        self._request_id = 0
        self._pending: dict[int | str, asyncio.Future] = {}
        self._reader_task: asyncio.Task | None = None
        self._tools: dict[str, dict] = {}  # tool_name -> schema
        self._initialized = False

    async def connect(self, register_tools: bool = True) -> bool:
        """Spawn the MCP server subprocess and perform initialization handshake."""
        if self.process is not None:
            return True

        env = os.environ.copy()
        env.update(self.config.env)

        try:
            self.process = await asyncio.create_subprocess_exec(
                self.config.command,
                *self.config.args,
                stdin=asyncio.subprocess.PIPE,
                stdout=asyncio.subprocess.PIPE,
                stderr=asyncio.subprocess.PIPE,
                env=env,
            )
        except FileNotFoundError:
            logger.error(
                f"MCP server '{self.config.name}': command not found: {self.config.command}"
            )
            return False
        except Exception:
            logger.exception(f"MCP server '{self.config.name}': failed to start")
            return False

        # Start background reader
        self._reader_task = asyncio.create_task(self._read_loop())

        # Initialize handshake
        try:
            result = await self._send_request(
                "initialize",
                {
                    "protocolVersion": "2024-11-05",
                    "capabilities": {},
                    "clientInfo": {"name": "morphix", "version": "1.0"},
                },
            )
            logger.info(
                f"MCP server '{self.config.name}' initialized: "
                f"{result.get('serverInfo', {}).get('name', 'unknown')} "
                f"v{result.get('protocolVersion', '?')}"
            )
        except Exception as e:
            logger.error(f"MCP server '{self.config.name}' init failed: {e}")
            await self.disconnect()
            return False

        # Send initialized notification
        try:
            stdin = self.process.stdin
            if stdin is None:
                logger.error(f"MCP server '{self.config.name}' has no stdin stream")
                return False
            await write_message(
                stdin,
                build_notification("notifications/initialized"),
            )
        except Exception:
            logger.warning(f"MCP server '{self.config.name}' initialized notification failed")

        # Discover tools
        try:
            result = await self._send_request("tools/list", {})
            tools = result.get("tools", [])
            for tool in tools:
                full_name = f"mcp:{self.config.tools_prefix}.{tool['name']}"
                self._tools[tool["name"]] = mcp_tool_to_morphix_params(tool)
                self._tools[tool["name"]]["full_name"] = full_name
            logger.info(f"MCP server '{self.config.name}': {len(tools)} tool(s) discovered")
        except Exception as e:
            logger.error(f"MCP server '{self.config.name}' tools/list failed: {e}")
            await self.disconnect()
            return False

        # Register tools in Morphix tool registry
        if register_tools:
            await self._register_discovered_tools()

        self._initialized = True
        return True

    async def _register_discovered_tools(self) -> None:
        """Register discovered MCP tools in Morphix tools_registry."""
        from tools.registry import tools_registry
        from tools.specs import TOOL_DEFINITIONS, ToolDefinition

        for native_name, params in self._tools.items():
            full_name = params.get("full_name", f"mcp:{self.config.tools_prefix}.{native_name}")
            # Sanitize: DeepSeek strict mode rejects : and . in tool names
            sanitized_name = full_name.replace(":", "_").replace(".", "_")
            description = f"[MCP:{self.config.name}] {params.get('description', '')}"

            # Create a closure that calls this client for the specific tool
            client_ref = self
            tool_native_name = native_name

            async def _mcp_proxy(
                _native=tool_native_name,
                _client=client_ref,
                **kwargs,
            ):
                return await _client.call_tool(_native, kwargs)

            _mcp_proxy.__name__ = sanitized_name

            # Register in tool specs with SANITIZED name for OpenAI function-calling
            TOOL_DEFINITIONS[sanitized_name] = ToolDefinition(
                name=sanitized_name,
                description=description,
                parameters=params.get("parameters", {}),
                required=params.get("required", []),
            )

            # Register callable under sanitized name (primary)
            tools_registry.register(sanitized_name)(_mcp_proxy)
            # Also register with original full name as alias
            if full_name != sanitized_name and full_name not in tools_registry.list_tools():
                tools_registry.register(full_name)(_mcp_proxy)
            # Also register with native short name as alias
            if native_name not in tools_registry.list_tools():
                tools_registry.register(native_name)(_mcp_proxy)
            logger.debug(f"MCP tool registered: {sanitized_name}")

    async def call_tool(self, name: str, arguments: dict) -> dict:
        """Call a tool on the MCP server. Returns Morphix-format result dict."""
        if not self._initialized:
            return {
                "success": False,
                "error": "mcp_not_connected",
                "output": f"MCP server '{self.config.name}' not connected",
            }

        # Strip mcp: prefix to get the native tool name
        native_name = name.split(".", 1)[-1] if "." in name else name

        try:
            result = await self._send_request(
                "tools/call",
                {"name": native_name, "arguments": arguments},
            )
            return mcp_result_to_morphix(result)
        except Exception as e:
            return {
                "success": False,
                "error": "mcp_tool_error",
                "output": f"MCP tool '{name}' error: {e}",
            }

    async def _send_request(self, method: str, params: dict, timeout: float = 30.0) -> dict:
        if self.process is None or self.process.stdin is None:
            raise ConnectionError("MCP client not connected")

        self._request_id += 1
        msg_id = self._request_id
        future: asyncio.Future = asyncio.get_running_loop().create_future()
        self._pending[msg_id] = future

        await write_message(self.process.stdin, build_request(msg_id, method, params))

        try:
            return await asyncio.wait_for(future, timeout=timeout)
        finally:
            self._pending.pop(msg_id, None)

    async def _read_loop(self) -> None:
        """Background task: read responses from server stdout and resolve futures."""
        if self.process is None or self.process.stdout is None:
            return
        try:
            while True:
                msg = await read_message(self.process.stdout)
                if is_response(msg):
                    msg_id = get_id(msg)
                    if msg_id is not None and msg_id in self._pending:
                        if "error" in msg:
                            self._pending[msg_id].set_exception(
                                RuntimeError(msg["error"].get("message", "MCP error"))
                            )
                        else:
                            self._pending[msg_id].set_result(msg.get("result", {}))
        except ConnectionError:
            logger.info(f"MCP server '{self.config.name}' stream closed")
        except asyncio.CancelledError:
            pass
        except Exception:
            logger.exception(f"MCP server '{self.config.name}' read loop error")

    async def disconnect(self) -> None:
        """Terminate the MCP server subprocess."""
        if self._reader_task is not None:
            self._reader_task.cancel()
            self._reader_task = None

        # Reject all pending futures
        for _msg_id, future in self._pending.items():
            if not future.done():
                future.set_exception(ConnectionError("MCP client disconnected"))
        self._pending.clear()

        if self.process is not None:
            try:
                self.process.terminate()
                await asyncio.wait_for(self.process.wait(), timeout=3.0)
            except (ProcessLookupError, TimeoutError):
                try:
                    self.process.kill()
                except ProcessLookupError:
                    pass
        self.process = None
        self._initialized = False
        self._tools.clear()
        logger.info(f"MCP server '{self.config.name}' disconnected")

    @property
    def tools(self) -> dict[str, dict]:
        return self._tools

Functions¶

connect `async` ¶

connect(register_tools: bool = True) -> bool

Spawn the MCP server subprocess and perform initialization handshake.

Source code in core/mcp/client.py

async def connect(self, register_tools: bool = True) -> bool:
    """Spawn the MCP server subprocess and perform initialization handshake."""
    if self.process is not None:
        return True

    env = os.environ.copy()
    env.update(self.config.env)

    try:
        self.process = await asyncio.create_subprocess_exec(
            self.config.command,
            *self.config.args,
            stdin=asyncio.subprocess.PIPE,
            stdout=asyncio.subprocess.PIPE,
            stderr=asyncio.subprocess.PIPE,
            env=env,
        )
    except FileNotFoundError:
        logger.error(
            f"MCP server '{self.config.name}': command not found: {self.config.command}"
        )
        return False
    except Exception:
        logger.exception(f"MCP server '{self.config.name}': failed to start")
        return False

    # Start background reader
    self._reader_task = asyncio.create_task(self._read_loop())

    # Initialize handshake
    try:
        result = await self._send_request(
            "initialize",
            {
                "protocolVersion": "2024-11-05",
                "capabilities": {},
                "clientInfo": {"name": "morphix", "version": "1.0"},
            },
        )
        logger.info(
            f"MCP server '{self.config.name}' initialized: "
            f"{result.get('serverInfo', {}).get('name', 'unknown')} "
            f"v{result.get('protocolVersion', '?')}"
        )
    except Exception as e:
        logger.error(f"MCP server '{self.config.name}' init failed: {e}")
        await self.disconnect()
        return False

    # Send initialized notification
    try:
        stdin = self.process.stdin
        if stdin is None:
            logger.error(f"MCP server '{self.config.name}' has no stdin stream")
            return False
        await write_message(
            stdin,
            build_notification("notifications/initialized"),
        )
    except Exception:
        logger.warning(f"MCP server '{self.config.name}' initialized notification failed")

    # Discover tools
    try:
        result = await self._send_request("tools/list", {})
        tools = result.get("tools", [])
        for tool in tools:
            full_name = f"mcp:{self.config.tools_prefix}.{tool['name']}"
            self._tools[tool["name"]] = mcp_tool_to_morphix_params(tool)
            self._tools[tool["name"]]["full_name"] = full_name
        logger.info(f"MCP server '{self.config.name}': {len(tools)} tool(s) discovered")
    except Exception as e:
        logger.error(f"MCP server '{self.config.name}' tools/list failed: {e}")
        await self.disconnect()
        return False

    # Register tools in Morphix tool registry
    if register_tools:
        await self._register_discovered_tools()

    self._initialized = True
    return True

call_tool `async` ¶

call_tool(name: str, arguments: dict) -> dict

Call a tool on the MCP server. Returns Morphix-format result dict.

Source code in core/mcp/client.py

async def call_tool(self, name: str, arguments: dict) -> dict:
    """Call a tool on the MCP server. Returns Morphix-format result dict."""
    if not self._initialized:
        return {
            "success": False,
            "error": "mcp_not_connected",
            "output": f"MCP server '{self.config.name}' not connected",
        }

    # Strip mcp: prefix to get the native tool name
    native_name = name.split(".", 1)[-1] if "." in name else name

    try:
        result = await self._send_request(
            "tools/call",
            {"name": native_name, "arguments": arguments},
        )
        return mcp_result_to_morphix(result)
    except Exception as e:
        return {
            "success": False,
            "error": "mcp_tool_error",
            "output": f"MCP tool '{name}' error: {e}",
        }

disconnect `async` ¶

disconnect() -> None

Terminate the MCP server subprocess.

Source code in core/mcp/client.py

async def disconnect(self) -> None:
    """Terminate the MCP server subprocess."""
    if self._reader_task is not None:
        self._reader_task.cancel()
        self._reader_task = None

    # Reject all pending futures
    for _msg_id, future in self._pending.items():
        if not future.done():
            future.set_exception(ConnectionError("MCP client disconnected"))
    self._pending.clear()

    if self.process is not None:
        try:
            self.process.terminate()
            await asyncio.wait_for(self.process.wait(), timeout=3.0)
        except (ProcessLookupError, TimeoutError):
            try:
                self.process.kill()
            except ProcessLookupError:
                pass
    self.process = None
    self._initialized = False
    self._tools.clear()
    logger.info(f"MCP server '{self.config.name}' disconnected")

Functions¶

connect_mcp_servers `async` ¶

connect_mcp_servers(workspace: str) -> None

Connect to all MCP servers configured for a workspace.

Source code in core/mcp/client.py

async def connect_mcp_servers(workspace: str) -> None:
    """Connect to all MCP servers configured for a workspace."""
    from core.mcp.config import load_mcp_servers

    configs = load_mcp_servers(workspace)
    for cfg in configs:
        if cfg.name in _clients:
            continue
        client = MCPClient(cfg)
        if await client.connect():
            _clients[cfg.name] = client

disconnect_mcp_servers `async` ¶

disconnect_mcp_servers() -> None

Disconnect all MCP clients.

Source code in core/mcp/client.py

async def disconnect_mcp_servers() -> None:
    """Disconnect all MCP clients."""
    for name in list(_clients):
        await _clients[name].disconnect()
    _clients.clear()

get_mcp_client_for_tool ¶

get_mcp_client_for_tool(tool_name: str) -> MCPClient | None

Find the MCP client that owns a given tool name (mcp:.name).

Source code in core/mcp/client.py

def get_mcp_client_for_tool(tool_name: str) -> "MCPClient | None":
    """Find the MCP client that owns a given tool name (mcp:<prefix>.name)."""
    if not tool_name.startswith("mcp:"):
        return None
    prefix = tool_name[4:].rsplit(".", 1)[0] if "." in tool_name else tool_name[4:]
    for client in _clients.values():
        if client.config.tools_prefix == prefix:
            return client
    return None

core.mcp.config ¶

Load MCP server configurations from JSON files.

Functions¶

load_mcp_servers ¶

load_mcp_servers(
    workspace: str | None = None,
) -> list[MCPServerConfig]

Load MCP server configs. Workspace-local overrides global.

Source code in core/mcp/config.py

def load_mcp_servers(workspace: str | None = None) -> list[MCPServerConfig]:
    """Load MCP server configs. Workspace-local overrides global."""
    from core.path_resolver import paths

    servers: dict[str, MCPServerConfig] = {}

    # Global config
    global_file = Path(__file__).parent.parent.parent / "mcp_servers.json"
    for cfg in _load_file(global_file):
        servers[cfg.name] = cfg

    # Workspace-local config (overrides same-named servers)
    if workspace:
        ws_file = paths.mcp_servers_file(workspace)
        for cfg in _load_file(ws_file):
            servers[cfg.name] = cfg

    return [s for s in servers.values() if s.enabled]

core.mcp.adapter ¶

Convert between Morphix ToolDefinition and MCP tool schema.

MCP tool format

{"name": "...", "description": "...", "inputSchema": {"type": "object", "properties": {...}, "required": [...]}}

Morphix tools use OpenAI function-calling format — we convert at the bridge.

Functions¶

morphix_to_mcp_tool ¶

morphix_to_mcp_tool(tool: dict[str, Any]) -> dict[str, Any]

Convert a Morphix tool dict to MCP tool format.

Input: {"name": "...", "description": "...", "parameters": {...}, "required": [...]} Output: {"name": "...", "description": "...", "inputSchema": {"type": "object", "properties": {...}, "required": [...]}}

Source code in core/mcp/adapter.py

def morphix_to_mcp_tool(tool: dict[str, Any]) -> dict[str, Any]:
    """Convert a Morphix tool dict to MCP tool format.

    Input: {"name": "...", "description": "...", "parameters": {...}, "required": [...]}
    Output: {"name": "...", "description": "...", "inputSchema": {"type": "object", "properties": {...}, "required": [...]}}
    """
    return {
        "name": tool["name"],
        "description": tool.get("description", ""),
        "inputSchema": {
            "type": "object",
            "properties": tool.get("parameters", {}),
            "required": tool.get("required", []),
        },
    }

mcp_tool_to_morphix_params ¶

mcp_tool_to_morphix_params(
    mcp_tool: dict[str, Any],
) -> dict[str, Any]

Extract Morphix-compatible params from an MCP tool schema.

Returns a dict suitable for tools_registry + tool_specs registration.

Source code in core/mcp/adapter.py

def mcp_tool_to_morphix_params(mcp_tool: dict[str, Any]) -> dict[str, Any]:
    """Extract Morphix-compatible params from an MCP tool schema.

    Returns a dict suitable for tools_registry + tool_specs registration.
    """
    input_schema = mcp_tool.get("inputSchema", {})
    return {
        "name": mcp_tool["name"],
        "description": mcp_tool.get("description", ""),
        "parameters": input_schema.get("properties", {}),
        "required": input_schema.get("required", []),
    }

mcp_result_to_morphix ¶

mcp_result_to_morphix(
    result: dict[str, Any],
) -> dict[str, Any]

Convert MCP tools/call result to Morphix tool output format.

MCP content: [{"type": "text", "text": "..."}, {"type": "image", "data": "...", "mimeType": "..."}] Morphix expects: {"success": bool, "output": str, ...}

Source code in core/mcp/adapter.py

def mcp_result_to_morphix(result: dict[str, Any]) -> dict[str, Any]:
    """Convert MCP tools/call result to Morphix tool output format.

    MCP content: [{"type": "text", "text": "..."}, {"type": "image", "data": "...", "mimeType": "..."}]
    Morphix expects: {"success": bool, "output": str, ...}
    """
    content = result.get("content", [])
    text_parts = []
    for item in content:
        if item.get("type") == "text":
            text_parts.append(item.get("text", ""))
        elif item.get("type") == "image":
            text_parts.append(f"[image: {item.get('mimeType', 'unknown')}]")
    return {
        "success": not result.get("isError", False),
        "output": "\n".join(text_parts),
        "raw": result,
    }

core.mcp.protocol ¶

JSON-RPC 2.0 framing over asyncio streams.

MCP uses JSON-RPC 2.0 with newline-delimited JSON over stdio. Messages are one JSON object per line (no pretty-print, no embedded newlines).

Functions¶

read_message `async` ¶

read_message(
    stream: asyncio.StreamReader,
) -> dict[str, Any]

Read one newline-delimited JSON message from a stream.

Source code in core/mcp/protocol.py

async def read_message(stream: asyncio.StreamReader) -> dict[str, Any]:
    """Read one newline-delimited JSON message from a stream."""
    line = await stream.readline()
    if not line:
        raise ConnectionError("MCP stream closed by remote")
    try:
        return json.loads(line.decode("utf-8"))
    except json.JSONDecodeError as e:
        logger.warning(f"MCP JSON parse error: {e} | raw: {line[:200]!r}")
        raise

write_message `async` ¶

write_message(
    stream: asyncio.StreamWriter, data: dict[str, Any]
) -> None

Write one JSON message as a single line to a stream.

Source code in core/mcp/protocol.py

async def write_message(stream: asyncio.StreamWriter, data: dict[str, Any]) -> None:
    """Write one JSON message as a single line to a stream."""
    encoded = json.dumps(data, ensure_ascii=False).encode("utf-8") + b"\n"
    stream.write(encoded)
    await stream.drain()

core.security.anti_distillation ¶

Anti-distillation hardening — watermark rotation, pattern detection, escalation.

Companion to undercover_mode.py. Provides: 1. Watermark rotation — 8 styles, rotated per workspace+time seed 2. Query similarity tracking — detects N similar queries (extraction pattern) 3. Escalation levels — warn → throttle → honeypot → lock 4. Honeypot generator — fake system prompts to waste attackers