# AI_Diplomacy/ai_diplomacy/game_logic.py

# ai_diplomacy/game_logic.py
import logging
import os
import json
import asyncio
from typing import Dict, List, Tuple, Optional, Any
from argparse import Namespace

from diplomacy import Game
from diplomacy.utils.export import to_saved_game_format, from_saved_game_format

from .agent import DiplomacyAgent, ALL_POWERS
from .clients import load_model_client
from .game_history import GameHistory
from .initialization import initialize_agent_state_ext
from .utils import atomic_write_json, assign_models_to_powers

logger = logging.getLogger(__name__)

# --- Serialization / Deserialization ---

def serialize_agent(agent: DiplomacyAgent) -> dict:
    """Build a plain-dict snapshot of *agent* intended for JSON output.

    The snapshot records the power name, the client's model name and token
    limit, and the agent's goals, relationships and both diary attributes.
    """
    llm_client = agent.client
    snapshot = dict(
        power_name=agent.power_name,
        model_id=llm_client.model_name,
        max_tokens=llm_client.max_tokens,
    )
    # The remaining fields are copied verbatim under their attribute names.
    for attr in ("goals", "relationships", "full_private_diary", "private_diary"):
        snapshot[attr] = getattr(agent, attr)
    return snapshot

def deserialize_agent(agent_data: dict, prompts_dir: Optional[str] = None) -> DiplomacyAgent:
    """Rebuild a DiplomacyAgent from a dictionary snapshot.

    Args:
        agent_data: Mapping that must contain "model_id" and "power_name";
            every other key is optional and falls back to a default.
        prompts_dir: Forwarded to both the model-client loader and the agent.

    Returns:
        The reconstructed agent with both diary attributes restored.
    """
    lookup = agent_data.get

    llm_client = load_model_client(agent_data["model_id"], prompts_dir=prompts_dir)
    # Older saves carry no "max_tokens" entry, hence the fallback value.
    llm_client.max_tokens = lookup("max_tokens", 16000)

    restored = DiplomacyAgent(
        power_name=agent_data["power_name"],
        client=llm_client,
        initial_goals=lookup("goals", []),
        initial_relationships=lookup("relationships", None),
        prompts_dir=prompts_dir,
    )

    # The diaries are not constructor arguments, so they are set afterwards.
    restored.full_private_diary = lookup("full_private_diary", [])
    restored.private_diary = lookup("private_diary", [])
    return restored

# --- State Management ---

# game_logic.py
_PHASE_ORDER = ["M", "R", "A"]          # Movement → Retreats → Adjustments

def _next_phase_name(short: str) -> str:
    """
    Return the Diplomacy phase string that chronologically follows *short*.
    (E.g.  S1901M → S1901R,  S1901R → W1901A,  W1901A → S1902M)
    """
    season = short[0]                   # 'S' | 'W'
    year   = int(short[1:5])
    typ    = short[-1]                  # 'M' | 'R' | 'A'

    idx = _PHASE_ORDER.index(typ)
    if idx < 2:                         # still in the same season
        return f"{season}{year}{_PHASE_ORDER[idx+1]}"

    # typ was 'A'  → roll season
    if season == "S":                   # summer → winter, same year
        return f"W{year}M"
    else:                               # winter→ spring, next year
        return f"S{year+1}M"

# Keys of a phase block that are treated as standard; every other key is
# considered custom metadata and is carried over between saves.
_STANDARD_PHASE_KEYS = frozenset(
    {"name", "orders", "results", "messages", "state", "config"}
)


def _phase_year(phase_name: str) -> Optional[int]:
    """Return the year at characters 1-4 of *phase_name*, or None if absent."""
    try:
        return int(phase_name[1:5])
    except (TypeError, ValueError):
        return None


def save_game_state(
    game: Game,
    agents: Dict[str, DiplomacyAgent],
    game_history: GameHistory,
    output_path: str,
    run_config: Namespace,
    completed_phase_name: str
):
    """
    Serialise the entire game to JSON, preserving per-phase custom metadata
    (e.g. 'state_agents') that may have been written by earlier save passes.

    Args:
        game: Game object to export via ``to_saved_game_format``.
        agents: Live agents keyed by power name.
        game_history: Source of the plans recorded for the completed phase.
        output_path: Destination file; also read first (if present) so that
            custom per-phase keys from an earlier save are retained.
        run_config: Run configuration; stored on the completed phase.  Its
            optional ``max_year`` stops metadata merging at the first phase
            whose year exceeds it.
        completed_phase_name: Name of the phase that receives the fresh
            config, agent snapshot and plans.
    """
    logger.info(f"Saving game state to {output_path}…")

    # ------------------------------------------------------------------ #
    # 1.  If the file already exists, cache the per-phase custom blocks. #
    # ------------------------------------------------------------------ #
    previous_phase_extras: Dict[str, Dict[str, Any]] = {}
    if os.path.isfile(output_path):
        try:
            with open(output_path, "r", encoding="utf-8") as fh:
                previous_save = json.load(fh)
            for phase in previous_save.get("phases", []):
                # Keep a copy of *all* non-standard keys so that future
                # additions survive automatically.
                extras = {
                    k: v for k, v in phase.items()
                    if k not in _STANDARD_PHASE_KEYS
                }
                if extras:
                    previous_phase_extras[phase["name"]] = extras
        except Exception as exc:
            # Best effort: a broken previous save must not block the new one.
            logger.warning(
                "Could not load previous save to retain metadata: %s", exc, exc_info=True
            )

    # -------------------------------------------------------------- #
    # 2.  Build the fresh base structure from the diplomacy library. #
    # -------------------------------------------------------------- #
    saved_game = to_saved_game_format(game)

    # -------------------------------------------------------------- #
    # 3.  Walk every phase and merge the metadata back in.           #
    # -------------------------------------------------------------- #
    # Capture the *current* snapshot of every live agent exactly once.
    current_state_agents = {
        p_name: serialize_agent(p_agent)
        for p_name, p_agent in agents.items()
        if not game.powers[p_name].is_eliminated()
    }

    # A missing or None max_year means "no cutoff".
    max_year = getattr(run_config, "max_year", None)

    for phase_block in saved_game.get("phases", []):
        phase_name = phase_block["name"]

        # Phase names without a numeric year (for instance a terminal marker
        # rather than <season><year><type>) used to abort the whole save with
        # ValueError; they are now simply never subject to the year cutoff.
        year = _phase_year(phase_name)
        if max_year is not None and year is not None and year > max_year:
            break

        # 3a.  Re-attach anything we cached from a previous save.
        if phase_name in previous_phase_extras:
            phase_block.update(previous_phase_extras[phase_name])

        # 3b.  For *this* phase we also inject the fresh agent snapshot
        #      and the plans written during the turn.
        if phase_name == completed_phase_name:
            phase_block["config"] = vars(run_config)
            phase_block["state_agents"] = current_state_agents

            # Plans for this phase – may be empty in non-movement phases.
            phase_obj = game_history._get_phase(phase_name)
            phase_block["state_history_plans"] = (
                phase_obj.plans if phase_obj else {}
            )

    # -------------------------------------------------------------- #
    # 4.  Attach top-level metadata and write via atomic_write_json. #
    # -------------------------------------------------------------- #
    saved_game["phase_summaries"] = getattr(game, "phase_summaries", {})
    saved_game["final_agent_states"] = {
        p_name: {"relationships": a.relationships, "goals": a.goals}
        for p_name, a in agents.items()
    }

    atomic_write_json(saved_game, output_path)

    logger.info("Game state saved successfully.")


def load_game_state(
    run_dir: str,
    game_file_name: str,
    resume_from_phase: Optional[str] = None
) -> Tuple[Game, Dict[str, DiplomacyAgent], GameHistory, Optional[Namespace]]:
    """Loads and reconstructs the game state from a saved game file.

    Args:
        run_dir: Directory containing the save file.
        game_file_name: File name of the save inside *run_dir*.
        resume_from_phase: If given, everything after this phase is dropped
            and the simulation restarts *at* this phase.

    Returns:
        ``(game, agents, game_history, run_config)``.  ``run_config`` is the
        most recent per-phase "config" found in the file, or None.  When no
        phases remain (fresh start), ``agents`` is empty and the history is
        new; the caller is expected to create the agents.

    Raises:
        FileNotFoundError: the save file does not exist.
        ValueError: *resume_from_phase* is not in the file (and is not
            "S1901M"), or the last completed phase has no 'state_agents'.
    """
    game_file_path = os.path.join(run_dir, game_file_name)
    if not os.path.exists(game_file_path):
        raise FileNotFoundError(f"Cannot resume. Save file not found at: {game_file_path}")

    logger.info(f"Loading game state from: {game_file_path}")
    # Saves are written as UTF-8, so read them back with the same encoding.
    with open(game_file_path, 'r', encoding="utf-8") as f:
        saved_game_data = json.load(f)

    # Normalise a missing/None "phases" entry to an empty list so the code
    # below can rely on the key being present.
    phases = saved_game_data.get("phases") or []
    saved_game_data["phases"] = phases

    # Find the latest config saved in the file
    run_config = None
    for phase in reversed(phases):
        if "config" in phase:
            run_config = Namespace(**phase["config"])
            logger.info(f"Loaded run configuration from phase {phase['name']}.")
            break

    # If resuming, find the specified phase and truncate the data after it
    if resume_from_phase:
        logger.info(f"Resuming from phase '{resume_from_phase}'. Truncating subsequent data.")
        resume_idx = next(
            (i for i, phase in enumerate(phases) if phase['name'] == resume_from_phase),
            None,
        )
        if resume_idx is not None:
            # Keep everything up to and including the resume phase.
            # Note: the state saved for a given phase represents the state at
            # the beginning of that phase.
            phases = phases[:resume_idx + 1]
            logger.info(f"Game history truncated to {len(phases)} phases. The next phase to run will be {resume_from_phase}.")
        elif resume_from_phase == "S1901M":
            # The very first phase may legitimately be absent from the file.
            phases = []
            logger.info("Resuming from S1901M. Starting with a clean history.")
        else:
            raise ValueError(f"Resume phase '{resume_from_phase}' not found in the save file.")
        saved_game_data['phases'] = phases

    # Wipe the data of the phase that will be re-run **but preserve the keys**.
    # Guarded: with a clean history there is no last phase to wipe (indexing
    # [-1] on the empty list previously raised IndexError here).
    if phases:
        last_phase = phases[-1]
        last_phase['orders'] = {}
        last_phase['results'] = {}
        last_phase['messages'] = []

    # Reconstruct the Game object.
    # NOTE(review): for an empty phase list this presumably yields a game in
    # its initial state — confirm against from_saved_game_format.
    game = from_saved_game_format(saved_game_data)

    game.phase_summaries = saved_game_data.get('phase_summaries', {})

    if not phases:
        # This happens if we are resuming from the very beginning (S1901M)
        logger.info("No previous phases found. Initializing fresh agents and history.")
        # Agents will be created by the main loop.
        return game, {}, GameHistory(), run_config

    # We save the game state up to & including the current (uncompleted) phase.
    # So we need to grab the agent state from the previous (completed) phase.
    completed_phase_data = phases[-2] if len(phases) > 1 else {}
    if 'state_agents' not in completed_phase_data:
        raise ValueError("Cannot resume: 'state_agents' key not found in the last phase of the save file.")

    # Rebuild agents
    logger.info("Rebuilding agents from saved state...")
    prompts_dir_from_config = getattr(run_config, 'prompts_dir', None)
    agents = {
        power_name: deserialize_agent(agent_data, prompts_dir=prompts_dir_from_config)
        for power_name, agent_data in completed_phase_data['state_agents'].items()
    }
    logger.info(f"Rebuilt {len(agents)} agents.")

    # Rebuild GameHistory from every phase except the one about to be re-run.
    game_history = GameHistory()
    logger.info("Rebuilding game history...")
    for phase_data in phases[:-1]:
        phase_name = phase_data['name']
        game_history.add_phase(phase_name)
        # Add messages
        for msg in phase_data.get('messages', []):
            game_history.add_message(phase_name, msg['sender'], msg['recipient'], msg['message'])
        # Add plans
        for p_name, plan in phase_data.get('state_history_plans', {}).items():
            game_history.add_plan(phase_name, p_name, plan)
    logger.info("Game history rebuilt.")

    return game, agents, game_history, run_config


async def initialize_new_game(
    args: Namespace,
    game: Game,
    game_history: GameHistory,
    llm_log_file_path: str
) -> Dict[str, DiplomacyAgent]:
    """Initializes agents for a new game.

    Args:
        args: Parsed run arguments; reads ``max_tokens``,
            ``max_tokens_per_model``, ``models`` and ``prompts_dir``.
        game: Game whose ``power_model_map`` is set here and whose powers
            are checked for elimination.
        game_history: Passed through to each agent's state initialization.
        llm_log_file_path: Passed through to each agent's state initialization.

    Returns:
        Agents keyed by power name.  An agent whose state initialization
        failed is still returned; the failure is only logged.
    """
    powers_order = sorted(ALL_POWERS)
    n_powers = len(powers_order)

    # Parse token limits
    default_max_tokens = args.max_tokens
    model_max_tokens = {p: default_max_tokens for p in powers_order}

    if args.max_tokens_per_model:
        per_model_values = [s.strip() for s in args.max_tokens_per_model.split(",")]
        if len(per_model_values) == n_powers:
            try:
                parsed_limits = [int(value) for value in per_model_values]
            except ValueError:
                # Same fallback policy as for a wrong number of values.
                logger.warning("Non-integer value in --max_tokens_per_model, using default.")
            else:
                model_max_tokens = dict(zip(powers_order, parsed_limits))
        else:
            logger.warning("Expected %d values for --max_tokens_per_model, using default.", n_powers)

    # Handle power model mapping
    if args.models:
        provided_models = [name.strip() for name in args.models.split(",")]
        if len(provided_models) == n_powers:
            game.power_model_map = dict(zip(powers_order, provided_models))
        else:
            logger.error(f"Expected {n_powers} models for --models but got {len(provided_models)}. Using defaults.")
            game.power_model_map = assign_models_to_powers()
    else:
        game.power_model_map = assign_models_to_powers()

    agents = {}
    initialization_tasks = []
    # Power name for each entry of initialization_tasks, kept in lockstep so
    # results are attributed correctly even if an agent was registered but
    # its task could not be created.
    task_powers = []
    logger.info("Initializing Diplomacy Agents for each power...")
    for power_name, model_id in game.power_model_map.items():
        if game.powers[power_name].is_eliminated():
            continue
        try:
            client = load_model_client(model_id, prompts_dir=args.prompts_dir)
            client.max_tokens = model_max_tokens[power_name]
            agent = DiplomacyAgent(power_name=power_name, client=client, prompts_dir=args.prompts_dir)
            agents[power_name] = agent
            logger.info(f"Preparing initialization task for {power_name} with model {model_id}")
            initialization_tasks.append(initialize_agent_state_ext(agent, game, game_history, llm_log_file_path, prompts_dir=args.prompts_dir))
            task_powers.append(power_name)
        except Exception as e:
            logger.error(f"Failed to create agent or client for {power_name} with model {model_id}: {e}", exc_info=True)

    logger.info(f"Running {len(initialization_tasks)} agent initializations concurrently...")
    initialization_results = await asyncio.gather(*initialization_tasks, return_exceptions=True)

    for power_name, result in zip(task_powers, initialization_results):
        # BaseException so that a cancelled task is not reported as a success.
        if isinstance(result, BaseException):
            logger.error(f"Failed to initialize agent state for {power_name}: {result}", exc_info=result)
        else:
            logger.info(f"Successfully initialized agent state for {power_name}.")

    return agents