Revert "Merge branch 'main' into animation"

This reverts commit d7f93f587a, reversing changes made to d505c7ea6c.
2026-04-19 12:58:09 +00:00 · 2025-03-04 20:31:14 -08:00 · 2025-03-04 20:31:14 -08:00 · 0242d7446b
commit 0242d7446b
parent d7f93f587a
25 changed files with 360 additions and 2580 deletions
--- a/lm_game.py
+++ b/lm_game.py
@@ -13,7 +13,7 @@ os.environ["GRPC_PYTHON_LOG_LEVEL"] = "40"  # ERROR level only
 from diplomacy import Game
 from diplomacy.utils.export import to_saved_game_format

-from ai_diplomacy.model_loader import load_model_client
+from ai_diplomacy.clients import load_model_client
 from ai_diplomacy.utils import (
    get_valid_orders,
    gather_possible_orders,
@@ -22,12 +22,9 @@ from ai_diplomacy.utils import (
 from ai_diplomacy.negotiations import conduct_negotiations
 from ai_diplomacy.planning import planning_phase
 from ai_diplomacy.game_history import GameHistory
-from ai_diplomacy.long_story_short import configure_context_manager
-from ai_diplomacy.clients import configure_logging

 dotenv.load_dotenv()

-# Configure logger with a consistent format
 logger = logging.getLogger(__name__)
 logging.basicConfig(
    level=logging.INFO,
@@ -35,18 +32,6 @@ logging.basicConfig(
    datefmt="%H:%M:%S",
 )

-# Configure specific loggers to reduce noise
-logging.getLogger("httpx").setLevel(logging.WARNING)
-logging.getLogger("httpcore").setLevel(logging.WARNING)
-logging.getLogger("urllib3").setLevel(logging.WARNING)
-logging.getLogger("anthropic").setLevel(logging.WARNING)
-logging.getLogger("openai").setLevel(logging.WARNING)
-
-# Ensure our application loggers are at appropriate levels
-logging.getLogger("client").setLevel(logging.INFO)
-logging.getLogger("ai_diplomacy").setLevel(logging.INFO)
-
-

 def parse_arguments():
    parser = argparse.ArgumentParser(
@@ -55,13 +40,13 @@ def parse_arguments():
    parser.add_argument(
        "--max_year",
        type=int,
-        default=1910,
+        default=1901,
        help="Maximum year to simulate. The game will stop once this year is reached.",
    )
    parser.add_argument(
        "--num_negotiation_rounds",
        type=int,
-        default=5,
+        default=0,
        help="Number of negotiation rounds per phase.",
    )
    parser.add_argument(
@@ -85,65 +70,15 @@ def parse_arguments():
        help="Enable the planning phase for each power to set strategic directives.",
    )
    return parser.parse_args()
- 
-
-def save_game_state(game, result_folder, game_file_path, model_error_stats, args, is_final=False):
-    """
-    Save the current game state and related information
-    
-    Args:
-        game: The diplomacy game instance
-        result_folder: Path to the results folder
-        game_file_path: Base path for the game file
-        model_error_stats: Dictionary containing model error statistics
-        args: Command line arguments
-        is_final: Boolean indicating if this is the final save
-    """
-    # Generate unique filename for periodic saves
-    timestamp = time.strftime("%Y%m%d_%H%M%S")
-    if not is_final:
-        output_path = f"{game_file_path}_checkpoint_{timestamp}.json"
-    else:
-        output_path = game_file_path
-        # If final file exists, append timestamp
-        if os.path.exists(output_path):
-            logger.info("STORAGE | Final game file already exists, saving with unique timestamp")
-            output_path = f"{output_path}_{timestamp}.json"
-    
-    # Save game state
-    to_saved_game_format(game, output_path=output_path)
-    
-    # Save overview data
-    overview_file_path = f"{result_folder}/overview.jsonl"
-    with open(overview_file_path, "w") as overview_file:
-        overview_file.write(json.dumps(model_error_stats) + "\n")
-        overview_file.write(json.dumps(game.power_model_map) + "\n")
-        overview_file.write(json.dumps(vars(args)) + "\n")
-    
-    logger.info(f"STORAGE | Game checkpoint saved to: {output_path}")


 def main():
    args = parse_arguments()
-    
-    # Configure logging
-    log_level = getattr(logging, args.log_level)
-    configure_logging(
-        log_full_prompts=args.log_full_prompts,
-        log_full_responses=args.log_full_responses,
-        suppress_connection_logs=not args.verbose,
-        log_level=log_level
-    )
-    
-    # Configure the context manager with the same summary model
-    configure_context_manager(
-        phase_threshold=15000,
-        message_threshold=15000,
-        summary_model=args.summary_model
-    )
    max_year = args.max_year

-    logger.info("GAME_START | Initializing Diplomacy game with multiple LLM agents")
+    logger.info(
+        "Starting a new Diplomacy game for testing with multiple LLMs, now concurrent!"
+    )
    start_whole = time.time()

    model_error_stats = defaultdict(
@@ -163,26 +98,6 @@ def main():
    result_folder = f"./results/{timestamp_str}"
    os.makedirs(result_folder, exist_ok=True)

-    # ---------------------------
-    # ADD FILE HANDLER FOR LOGS
-    # ---------------------------
-    log_file_path = os.path.join(result_folder, "game.log")
-    file_handler = logging.FileHandler(log_file_path)
-    file_handler.setLevel(logging.DEBUG)  # Ensure we capture all levels in the file
-    file_handler.setFormatter(
-        logging.Formatter("%(asctime)s [%(levelname)s] %(name)s - %(message)s", datefmt="%H:%M:%S")
-    )
-    
-    # Add the handler to root logger to capture all modules' logs
-    logging.getLogger().addHandler(file_handler)
-    
-    # Also add to specific loggers we care about most for summarization
-    logging.getLogger("ai_diplomacy.long_story_short").addHandler(file_handler)
-    logging.getLogger("ai_diplomacy.long_story_short").setLevel(logging.DEBUG)
-    
-    logger.info(f"LOGGING | File handler configured to write logs to {log_file_path}")
-    logger.info(f"LOGGING | Capturing detailed context management logs at DEBUG level")
-
    # File paths
    manifesto_path = f"{result_folder}/game_manifesto.txt"
    # Use provided output filename or generate one based on the timestamp
@@ -204,46 +119,33 @@ def main():
        provided_models = [name.strip() for name in args.models.split(",")]
        if len(provided_models) != len(powers_order):
            logger.error(
-                f"CONFIG_ERROR | Expected {len(powers_order)} models in --models argument but got {len(provided_models)}. Exiting."
+                f"Expected {len(powers_order)} models for --power-models but got {len(provided_models)}. Exiting."
            )
            return
        game.power_model_map = dict(zip(powers_order, provided_models))
    else:
-        game.power_model_map = assign_models_to_powers(randomize=True)
-
-    logger.debug("POWERS | Model assignments:")
-    for power, model_id in game.power_model_map.items():
-        logger.debug(f"POWERS | {power} assigned to {model_id}")
-
-    # Also, if you prefer to fix the negotiation function:
-    # We could do a one-liner ensuring all model_id are strings:
-    for p in game.power_model_map:
-        if not isinstance(game.power_model_map[p], str):
-            game.power_model_map[p] = str(game.power_model_map[p])
-
-    logger.debug("POWERS | Verified all power model IDs are strings")
-
-    round_counter = 0  # Track number of rounds
+        game.power_model_map = assign_models_to_powers()

    while not game.is_game_done:
        phase_start = time.time()
        current_phase = game.get_current_phase()
        logger.info(
-            f"PHASE | {current_phase} | Starting (elapsed game time: {phase_start - start_whole:.2f}s)"
+            f"PHASE: {current_phase} (time so far: {phase_start - start_whole:.2f}s)"
        )

-        # Get the current short phase
-        logger.debug(f"PHASE | Current short phase: '{game.current_short_phase}'")
+        # DEBUG: Print the short phase to confirm
+        logger.info(f"DEBUG: current_short_phase is '{game.current_short_phase}'")

        # Prevent unbounded simulation based on year
        year_str = current_phase[1:5]
        year_int = int(year_str)
        if year_int > max_year:
-            logger.info(f"GAME_END | Reached year limit ({year_int} > {max_year}), terminating game")
+            logger.info(f"Reached year {year_int}, stopping the test game early.")
            break

        # If it's a movement phase (e.g. ends with "M"), conduct negotiations
        if game.current_short_phase.endswith("M"):
+            
            if args.planning_phase:
                logger.info("Starting planning phase block...")
                game_history = planning_phase(
@@ -258,14 +160,13 @@ def main():
                model_error_stats,
                max_rounds=args.num_negotiation_rounds,
            )
+
        # Gather orders from each power concurrently
        active_powers = [
            (p_name, p_obj)
            for p_name, p_obj in game.powers.items()
            if not p_obj.is_eliminated()
        ]
-        
-        logger.info(f"ORDERS | {current_phase} | Requesting orders from {len(active_powers)} active powers")

        with concurrent.futures.ThreadPoolExecutor(
            max_workers=len(active_powers)
@@ -273,10 +174,10 @@ def main():
            futures = {}
            for power_name, _ in active_powers:
                model_id = game.power_model_map.get(power_name, "o3-mini")
-                client = load_model_client(model_id, power_name=power_name)
+                client = load_model_client(model_id)
                possible_orders = gather_possible_orders(game, power_name)
                if not possible_orders:
-                    logger.info(f"ORDERS | {power_name} | No orderable locations, skipping")
+                    logger.info(f"No orderable locations for {power_name}; skipping.")
                    continue
                board_state = game.get_state()

@@ -288,24 +189,26 @@ def main():
                    power_name,
                    possible_orders,
                    game_history,
-                    game.phase_summaries,
                    model_error_stats,
                )
                futures[future] = power_name
-                logger.debug(f"ORDERS | {power_name} | Requested orders from {model_id}")
+                logger.debug(f"Submitted get_valid_orders task for {power_name}.")

            for future in concurrent.futures.as_completed(futures):
                p_name = futures[future]
                try:
                    orders = future.result()
+                    logger.debug(f"Validated orders for {p_name}: {orders}")
                    if orders:
-                        logger.debug(f"ORDERS | {p_name} | Received {len(orders)} valid orders")
                        game.set_orders(p_name, orders)
-                        logger.debug(f"ORDERS | {p_name} | Orders set for {game.current_short_phase}")
+                        logger.debug(
+                            f"Set orders for {p_name} in {game.current_short_phase}: {orders}"
+                        )
                    else:
-                        logger.warning(f"ORDERS | {p_name} | No valid orders returned")
+                        logger.debug(f"No valid orders returned for {p_name}.")
                except Exception as exc:
-                    logger.error(f"ORDERS | {p_name} | Request failed: {str(exc)[:150]}")
+                    logger.error(f"LLM request failed for {p_name}: {exc}")
+
        logger.info("Processing orders...\n")
        game.process()
        # Add orders to game history
@@ -328,7 +231,8 @@ def main():
                game.order_history[current_phase][power_name],
                results,
            )
-        logger.info(f"PROCESSING | {current_phase} | Phase completed")
+        logger.info("Phase complete.\n")
+
        # Append the strategic directives to the manifesto file
        strategic_directives = game_history.get_strategic_directives()
        if strategic_directives:
@@ -343,17 +247,28 @@ def main():
        year_str = current_phase[1:5]
        year_int = int(year_str)
        if year_int > max_year:
-            logger.info(f"GAME_END | Reached year limit ({year_int} > {max_year}), terminating game")
+            logger.info(f"Reached year {year_int}, stopping the test game early.")
            break

    # Save final result
    duration = time.time() - start_whole
-    logger.info(f"GAME_END | Duration: {duration:.2f}s | Saving final state")
-    
-    save_game_state(game, result_folder, game_file_path, model_error_stats, args, is_final=True)
-    
-    logger.info(f"STORAGE | Game data saved in: {result_folder}")
-    logger.info("GAME_END | Simulation complete")
+    logger.info(f"Game ended after {duration:.2f}s. Saving to final JSON...")
+
+    output_path = game_file_path
+    # If the file already exists, append a timestamp to the filename
+    if os.path.exists(output_path):
+        logger.info("Game file already exists, saving with unique filename.")
+        output_path = f"{output_path}_{time.strftime('%Y%m%d_%H%M%S')}.json"
+    to_saved_game_format(game, output_path=output_path)
+
+    # Dump error stats and power model mapping to the overview file
+    with open(overview_file_path, "w") as overview_file:
+        overview_file.write(json.dumps(model_error_stats) + "\n")
+        overview_file.write(json.dumps(game.power_model_map) + "\n")
+        overview_file.write(json.dumps(vars(args)) + "\n")
+
+    logger.info(f"Saved game data, manifesto, and error stats in: {result_folder}")
+    logger.info("Done.")


 if __name__ == "__main__":