evotraders/backend/agents/prompts/builder.py

# -*- coding: utf-8 -*-
"""PromptBuilder for constructing system prompts from workspace markdown files.

Based on CoPaw design - loads AGENTS.md, SOUL.md, PROFILE.md, etc. from
agent workspace directories with YAML frontmatter support.
"""
from __future__ import annotations

import logging
from pathlib import Path
from typing import Any, Dict, List, Optional

import yaml

logger = logging.getLogger(__name__)

DEFAULT_SYS_PROMPT = """You are a helpful trading analysis assistant."""


class PromptBuilder:
    """Builder for constructing system prompts from markdown files.

    Loads markdown configuration files from agent workspace directories,
    supporting YAML frontmatter for metadata extraction.
    """

    DEFAULT_FILES = [
        "AGENTS.md",
        "SOUL.md",
        "PROFILE.md",
        "POLICY.md",
        "MEMORY.md",
    ]

    TITLE_MAP: Dict[str, str] = {
        "AGENTS.md": "Agent Guide",
        "SOUL.md": "Soul",
        "PROFILE.md": "Profile",
        "POLICY.md": "Policy",
        "MEMORY.md": "Memory",
        "BOOTSTRAP.md": "Bootstrap",
    }

    def __init__(
        self,
        workspace_dir: Path,
        enabled_files: Optional[List[str]] = None,
    ):
        """Initialize prompt builder.

        Args:
            workspace_dir: Directory containing markdown configuration files
            enabled_files: List of filenames to load (if None, uses defaults)
        """
        self.workspace_dir = Path(workspace_dir)
        self.enabled_files = enabled_files or self.DEFAULT_FILES.copy()
        self._prompt_parts: List[str] = []
        self._metadata: Dict[str, Any] = {}
        self.loaded_count = 0

    def _load_file(self, filename: str) -> tuple[str, Optional[Dict[str, Any]]]:
        """Load a single markdown file with YAML frontmatter support.

        Args:
            filename: Name of the file to load

        Returns:
            Tuple of (content, metadata dict or None)
        """
        file_path = self.workspace_dir / filename

        if not file_path.exists():
            logger.debug("File %s not found in %s, skipping", filename, self.workspace_dir)
            return "", None

        try:
            raw_content = file_path.read_text(encoding="utf-8").strip()

            if not raw_content:
                logger.debug("Skipped empty file: %s", filename)
                return "", None

            content, metadata = self._parse_frontmatter(raw_content)

            if content:
                self.loaded_count += 1
                logger.debug("Loaded %s (metadata: %s)", filename, bool(metadata))

            return content, metadata

        except Exception as e:
            logger.warning("Failed to read file %s: %s, skipping", filename, e)
            return "", None

    def _parse_frontmatter(self, raw_content: str) -> tuple[str, Optional[Dict[str, Any]]]:
        """Parse YAML frontmatter from markdown content.

        Args:
            raw_content: Raw file content

        Returns:
            Tuple of (content without frontmatter, metadata dict or None)
        """
        if not raw_content.startswith("---"):
            return raw_content, None

        parts = raw_content.split("---", 2)
        if len(parts) < 3:
            return raw_content, None

        frontmatter = parts[1].strip()
        content = parts[2].strip()

        try:
            metadata = yaml.safe_load(frontmatter) or {}
            if not isinstance(metadata, dict):
                metadata = {}
            return content, metadata
        except yaml.YAMLError as e:
            logger.warning("Failed to parse YAML frontmatter: %s", e)
            return content, None

    def _append_section(self, title: str, content: str) -> None:
        """Append a section to the prompt parts.

        Args:
            title: Section title
            content: Section content
        """
        content = content.strip()
        if not content:
            return

        if self._prompt_parts:
            self._prompt_parts.append("")

        self._prompt_parts.append(f"## {title}")
        self._prompt_parts.append("")
        self._prompt_parts.append(content)

    def build(self) -> str:
        """Build the system prompt from markdown files.

        Returns:
            Constructed system prompt string
        """
        self._prompt_parts = []
        self._metadata = {}
        self.loaded_count = 0

        for filename in self.enabled_files:
            content, metadata = self._load_file(filename)

            if metadata:
                self._metadata[filename] = metadata

            if content:
                title = self.TITLE_MAP.get(filename, filename.replace(".md", ""))
                self._append_section(title, content)

        if not self._prompt_parts:
            logger.warning("No content loaded from workspace: %s", self.workspace_dir)
            return DEFAULT_SYS_PROMPT

        final_prompt = "\n".join(self._prompt_parts)

        logger.debug(
            "System prompt built from %d file(s), total length: %d chars",
            self.loaded_count,
            len(final_prompt),
        )

        return final_prompt

    def get_metadata(self) -> Dict[str, Any]:
        """Get metadata collected from YAML frontmatter.

        Returns:
            Dictionary mapping filenames to their metadata
        """
        return self._metadata.copy()

    def get_agent_identity(self) -> Optional[Dict[str, Any]]:
        """Extract agent identity from PROFILE.md metadata.

        Returns:
            Identity dict with name, role, etc. or None
        """
        profile_meta = self._metadata.get("PROFILE.md", {})
        if not profile_meta:
            return None

        return {
            "name": profile_meta.get("name", "Unknown"),
            "role": profile_meta.get("role", ""),
            "expertise": profile_meta.get("expertise", []),
            "style": profile_meta.get("style", ""),
        }


def build_system_prompt_from_workspace(
    workspace_dir: Path,
    enabled_files: Optional[List[str]] = None,
    agent_id: Optional[str] = None,
    extra_context: Optional[str] = None,
) -> str:
    """Build system prompt from workspace markdown files.

    This is the main entry point for building system prompts from
    agent workspace directories.

    Args:
        workspace_dir: Directory containing markdown configuration files
        enabled_files: List of filenames to load (if None, uses defaults)
        agent_id: Agent identifier to include in system prompt
        extra_context: Additional context to append to the prompt

    Returns:
        Constructed system prompt string
    """
    builder = PromptBuilder(
        workspace_dir=workspace_dir,
        enabled_files=enabled_files,
    )

    prompt = builder.build()

    # Add agent identity header if agent_id provided
    if agent_id and agent_id != "default":
        identity_header = (
            f"# Agent Identity\n\n"
            f"Your agent ID is `{agent_id}`. "
            f"This is your unique identifier in the multi-agent system.\n\n"
        )
        prompt = identity_header + prompt

    # Append extra context if provided
    if extra_context:
        prompt = prompt + "\n\n" + extra_context

    return prompt


def build_bootstrap_guidance(language: str = "zh") -> str:
    """Build bootstrap guidance message for first-time setup.

    Args:
        language: Language code (zh/en)

    Returns:
        Formatted bootstrap guidance message
    """
    if language == "zh":
        return (
            "# 引导模式\n"
            "\n"
            "工作目录中存在 `BOOTSTRAP.md` — 首次设置。\n"
            "\n"
            "1. 阅读 BOOTSTRAP.md，友好地表示初次见面，"
            "引导用户完成设置。\n"
            "2. 按照 BOOTSTRAP.md 的指示，"
            "帮助用户定义你的身份和偏好。\n"
            "3. 按指南创建/更新必要文件"
            "（PROFILE.md、MEMORY.md 等）。\n"
            "4. 完成后删除 BOOTSTRAP.md。\n"
            "\n"
            "如果用户希望跳过，直接回答下面的问题即可。\n"
            "\n"
            "---\n"
            "\n"
        )

    return (
        "# BOOTSTRAP MODE\n"
        "\n"
        "`BOOTSTRAP.md` exists — first-time setup.\n"
        "\n"
        "1. Read BOOTSTRAP.md, greet the user, "
        "and guide them through setup.\n"
        "2. Follow BOOTSTRAP.md instructions "
        "to define identity and preferences.\n"
        "3. Create/update files "
        "(PROFILE.md, MEMORY.md, etc.) as described.\n"
        "4. Delete BOOTSTRAP.md when done.\n"
        "\n"
        "If the user wants to skip, answer their "
        "question directly instead.\n"
        "\n"
        "---\n"
        "\n"
    )


__all__ = [
    "PromptBuilder",
    "build_system_prompt_from_workspace",
    "build_bootstrap_guidance",
    "DEFAULT_SYS_PROMPT",
]