make a long form dataframe of each order in game from log data

2026-04-22 16:49:15 +00:00 · 2025-07-01 22:49:00 -04:00 · 2025-07-01 22:49:00 -04:00 · 00ce085e35
commit 00ce085e35
parent 0bd909b30b
1 changed files with 375 additions and 0 deletions
--- a/analysis/make_longform_orders_data.py
+++ b/analysis/make_longform_orders_data.py
@ -0,0 +1,375 @@
+"""
+
+Set-up & constants
+    imports pandas, numpy, json, copy, re, os
+    hard-codes lists for the seven Diplomacy powers, every supply-center (SC) province, and the coastal SC variants
+
+Top-level function make_longform_order_data(game_data_folder, selected_game)
+Runs end-to-end for one game folder and returns a single long-form DataFrame (all_orders_ever).
+
+expected game data files:
+    overview.jsonl → maps each country to the LLM model that played it
+    lmvsgame.json → full turn-by-turn log in the LM vs Game Engine format
+    llm_responses.csv → every prompt/response the agent produced
+
+Build a “turn_actions” super-table
+    state snapshots (units, centers, influence) per phase → status_over_time
+    order strings plus their official adjudication results → orders_over_time
+    concatenate the two; index is COUNTRY_[units|centers|influence|orders], columns are phase names.
+
+Explode into one-row-per-order (all_orders_ever)
+    melt orders_over_time, dropping nulls, so each record has:
+    country, phase, order (raw text, e.g. "A PAR - BUR (MOVE)")
+    classify order with regexes → command ∈ {Move, Hold, Support Move, …}.
+    extract unit_location, destination, boolean SC flags, and the adjudication result.
+
+Annotate ownership & influence
+    Helper lambdas walk back into the phase state to tag:
+    which power currently controls unit_location or destination
+    whether the unit is trespassing or attempting to trespass
+    who owns any piece occupying the square the unit is moving into.
+
+Support logic
+    finds which orders support a given unit and records the supporting powers
+    adds convenience flags (was_supported, supported_by_self, supported_by_other, etc.).
+
+Merge relationship matrices (5 possible states: Enemy, Unfriendly, Neutral, Friendly, Ally)
+    current country's view of all others (relationship_england, …)
+    how all others rate this country (englands_relationship_rating, …).
+
+Add strategic context columns
+    supporting_self, supporting_an_ally
+    weight column unit_order_weight (inverse of the country's total number of unit-orders for averaging).
+
+Fuse LLM reasoning
+    pulls the order-generation rows out of llm_responses.csv
+    extracts free-text “reasoning”, unformatted order blob, length, and success flag (if can be done)
+
+Return / save
+    The function returns the enriched DataFrame
+    Run from CLI to process all games: python make_longform_orders_data.py 
+    
+"""
+
+import pandas as pd
+import numpy as np
+import os 
+import json 
+import copy
+import re 
+import argparse
+
+
+supply_centers = [
+    "ANK", "ARM", "BEL", "BER", "BUD", "BUL", "CON", "DEN", "EDI", "GRE",
+    "HOL", "KIE", "LON", "LVP", "MAR", "MOS", "MUN", "NAP", "PAR", "POR",
+    "ROM", "RUM", "SER", "SEV", "SMY", "SWE", "TRI", "TUN",
+    "VEN", "VIE", "WAR", 
+    "SPA", "STP", "BUL" # coastal provinces
+]
+
+coastal_scs = ["SPA/SC", "SPA/NC",
+    "STP/SC", "STP/NC", 'BUL/EC',
+       'BUL/SC',]
+
+COUNTRIES = ['AUSTRIA', 'ENGLAND', 'FRANCE', 'GERMANY', 'ITALY', 'RUSSIA', 'TURKEY']
+
+def make_longform_order_data(game_data_folder, selected_game):
+    path_to_folder = f"{game_data_folder}/{selected_game}"
+
+    assert os.path.exists(f"{path_to_folder}/overview.jsonl"), f"Overview file not found in {path_to_folder}"
+    overview = pd.read_json(f"{path_to_folder}/overview.jsonl", lines=True)
+    country_to_model = overview.loc[1, COUNTRIES] # map countries to models
+
+    # get all turn actions from lmvs
+    assert os.path.exists(f"{path_to_folder}/lmvsgame.json"), f"LMVS file not found in {path_to_folder}"
+    path_to_file = f"{path_to_folder}/lmvsgame.json"
+
+    # Use the standard `json` library to load the file into a Python object
+    with open(path_to_file, 'r') as f:
+        lmvs_data = json.load(f)
+    ################## PART 1 ##################
+    # build `turn_actions` dataframe
+
+    # Get units at each turn
+    status_over_time = []
+    for phase in lmvs_data["phases"]:
+        phase_list = []
+        for var in ["units", "centers", "influence"]:
+            phase_list.append(pd.Series(phase["state"][var]).rename(phase["name"]).add_suffix(f"_{var}"))
+        status_over_time.append(pd.concat(phase_list))
+        
+    status_over_time = pd.concat(status_over_time, axis=1)
+
+    # Get orders + outcome 
+    orders_over_time = []
+    for phase in lmvs_data["phases"]:
+        phase_orders = copy.deepcopy(phase["orders"])
+        result_of_orders = phase["results"]
+        
+        for country, order_list in phase_orders.items():
+            if order_list:
+                for i, order in enumerate(order_list):
+                    identifier = order[:5]
+                    if result_of_orders.get(identifier, None):
+                        results = '/'.join(result_of_orders[identifier]).upper()
+                        if results:
+                            order_list[i] = order_list[i] + f" ({results})"
+                    
+        orders_over_time.append(pd.Series(phase_orders).rename(phase["name"]).add_suffix("_orders"))
+    orders_over_time = pd.concat(orders_over_time, axis=1)
+
+
+    # index for COUNTRY_[turn_status], columns for PHASE, each value a list
+    turn_actions = pd.concat([orders_over_time, status_over_time])
+
+
+    ################## PART 2 ##################
+    # Data by orders
+
+    # Snippet to pull out and classifier all orders
+    place_identifier = "[A-Z]{3}(?:/[A-Z]{2})?"
+    place_capturing_regex = r"([A-Z]{3})"
+    unit_identifier = rf"[AF] {place_identifier}"
+    unit_move = rf"{unit_identifier} . {place_identifier}"
+
+    possible_commands = {
+        "Move": f"^"+unit_move, # distinguishing this from support
+        "Support Move": f"{unit_identifier} S {unit_move}",
+        "Support Hold": fr"{unit_identifier} S {unit_identifier}(?!\s+[.\-]\s+{place_identifier})",
+        "Convoy": f"F {place_identifier} C {unit_move}", # No convoys in here? 
+        "Hold": f"{unit_identifier} H",
+        "Build": f"{unit_identifier} B",
+        "Disband": f"{unit_identifier} D",
+        "Retreat": f"{unit_identifier} R",
+    }
+    # build the data frame
+    all_orders_ever = turn_actions.loc[turn_actions.index.str.contains("orders")].reset_index(names="country").melt(id_vars="country", 
+                                                                                                    var_name="phase", 
+                                                                                                    value_name="order").dropna().explode("order")
+    all_orders_ever = all_orders_ever.dropna(subset="order").reset_index(drop=True)
+
+    # categorize each order based on regex
+    # note that this will overwrite if multiple regexes match, which is why we've split support into 2 commands
+    for possible_command, regex in possible_commands.items():
+        all_orders_ever.loc[all_orders_ever.order.str.contains(regex, regex=True), "command"] = possible_command
+        
+    all_orders_ever["unit_location"] = all_orders_ever["order"].str.extract(rf"({place_identifier})")
+    all_orders_ever["location_was_sc"] = all_orders_ever["unit_location"].isin(supply_centers) | all_orders_ever["unit_location"].isin(coastal_scs)
+
+    # only MOVE has a destination
+    all_orders_ever["destination"] = np.where(
+        all_orders_ever["command"]=="Move",
+        all_orders_ever["order"].str.extract(rf"{unit_identifier} . ({place_identifier})", expand=False),
+        np.nan
+    )
+    all_orders_ever["destination_was_sc"] = all_orders_ever["destination"].isin(supply_centers) | all_orders_ever["destination"].isin(coastal_scs)
+
+    # Retreat also has a destination
+    all_orders_ever.loc[all_orders_ever["command"]=="Retreat", "destination"] = all_orders_ever.loc[all_orders_ever["command"]=="Retreat", "order"].str.extract(rf"{unit_identifier} R ({place_identifier})", expand=False)
+
+    all_orders_ever["immediate_result"] = all_orders_ever["order"].str.extract(r"\(([^)]+)\)")
+    all_orders_ever["immediate_result"] = all_orders_ever["immediate_result"].fillna("PASS")
+
+    all_orders_ever["country"] = all_orders_ever["country"].str.replace("_orders", "")
+        
+    all_orders_ever["model"] = all_orders_ever["country"].map(country_to_model)
+    all_orders_ever["model_short_name"] = all_orders_ever["model"].str.split("/").str[-1]
+    all_orders_ever["country_model"] = all_orders_ever["country"] + " (" + all_orders_ever["model_short_name"] + ")"
+
+    def check_location_influence(phase_id, location):
+        if pd.isnull(location):
+            return np.nan
+        current_influence = turn_actions.loc[turn_actions.index.str.contains("influence"), phase_id]
+        current_influence.index = current_influence.index.str.replace("_influence", "")
+        for country, influence in current_influence.items():
+            if location in influence:
+                return country
+        return "Unowned"
+
+    all_orders_ever["unit_location_affiliation"] = all_orders_ever.apply(lambda row: check_location_influence(row["phase"],
+                                                                                                            row["unit_location"]), axis=1)
+    all_orders_ever["destination_affiliation"] = all_orders_ever.apply(lambda row: check_location_influence(row["phase"],
+                                                                                                            row["destination"]), axis=1)
+
+    def find_supporting_country(unit_command, command_type, phase):
+        if command_type == "Move" or command_type == "Hold":
+            potential_supports = all_orders_ever[(all_orders_ever["phase"] == phase) & 
+                                                (all_orders_ever["command"].isin(["Support Move", "Support Hold"]))]
+            potential_supports = potential_supports[potential_supports["order"].str.contains(unit_command)]
+            if potential_supports.empty:
+                return np.nan
+            else:
+                return ",".join(potential_supports["country"].tolist())
+        return np.nan
+
+    all_orders_ever["supported_by"] = all_orders_ever.apply(lambda row: find_supporting_country(row["order"], row["command"], row["phase"]), axis=1)
+    all_orders_ever["in_anothers_territory"] =( all_orders_ever["country"] != all_orders_ever["unit_location_affiliation"]) & (all_orders_ever["unit_location_affiliation"] != "Unowned")
+    all_orders_ever["moving_into_anothers_territory"] = (all_orders_ever["country"] != all_orders_ever["destination_affiliation"]) & (all_orders_ever["destination_affiliation"].notnull()) & (all_orders_ever["destination_affiliation"] != "Unowned")
+
+    def find_owner_of_unit(unit_location, phase):
+        if pd.notnull(unit_location):
+            unit_status = turn_actions.loc[turn_actions.index.str.contains("_units"), phase]
+            unit_status.index = unit_status.index.str.replace("_units", "")
+            for country, units in unit_status.items():
+                for unit in units:
+                    if re.match(f"[AF] {unit_location}", unit):
+                        return country
+
+    # where were they going? what was their destination like?
+    def find_destination_info(destination, phase):
+        if pd.notnull(destination):
+            country = find_owner_of_unit(destination, phase)
+            destination_unit_orders = all_orders_ever[(all_orders_ever["country"] == country) & 
+                                                                (all_orders_ever["phase"] == phase) & 
+                                                                (all_orders_ever["unit_location"] == destination)]
+            if not destination_unit_orders.empty:
+                return {"destination_unit_owner": country, 
+                                "destination_unit_order": destination_unit_orders["command"].squeeze(),
+                                "destination_unit_outcome":destination_unit_orders["immediate_result"].squeeze(),
+                                "destination_unit_supported_by": destination_unit_orders["supported_by"].squeeze()}    
+
+    destination_unit_info = all_orders_ever.apply(lambda row: find_destination_info(row["destination"], row["phase"]), axis=1).apply(pd.Series)
+    destination_unit_info["destination_was_occupied"] = destination_unit_info["destination_unit_owner"].notnull()
+
+    all_orders_ever = pd.concat([all_orders_ever, destination_unit_info], axis=1)
+
+    # if a Support action: who were they supporting? what was their support doing?
+    def find_support_recipient_info(unit_order, command, phase):
+        if "Support" in command:
+            recipient_location = re.match(rf"{unit_identifier} S [AF] ({place_identifier})", unit_order).group(1)
+            recipient_country = find_owner_of_unit(recipient_location, phase)
+            recipient_order_info = all_orders_ever[(all_orders_ever["country"] == recipient_country) & 
+                                                (all_orders_ever["phase"] == phase) & 
+                                                (all_orders_ever["unit_location"] == recipient_location)]
+            return {"recipient_unit_owner": recipient_country, "recipient_unit_outcome": recipient_order_info["immediate_result"].squeeze(),
+                    "recipient_unit_in_anothers_territory": recipient_order_info["in_anothers_territory"].squeeze(),
+                    "recipient_unit_moving_into_anothers_territory": recipient_order_info["moving_into_anothers_territory"].squeeze(),
+                    "recipient_unit_destination_occupied": recipient_order_info["destination_was_occupied"].squeeze()}
+
+    support_recipient_info = all_orders_ever.apply(lambda row: find_support_recipient_info(row["order"], row["command"], row["phase"]), axis=1).apply(pd.Series)
+    all_orders_ever = pd.concat([all_orders_ever, support_recipient_info], axis=1)
+
+    # add relationships with other countries
+    agent_relationship_matrix_over_time = {}
+    for phase in lmvs_data["phases"]:
+        agent_relationship_matrix_over_time[phase["name"]] = pd.DataFrame(phase.get("agent_relationships", {}))
+    longform_relationships = pd.concat(agent_relationship_matrix_over_time).reset_index(names=["phase", "agent"])
+    longform_relationships.columns = longform_relationships.columns.str.lower()
+    longform_relationships[['austria', 'england', 'france', 'germany', 'italy',
+        'russia', 'turkey']] = longform_relationships[['austria', 'england', 'france', 'germany', 'italy',
+        'russia', 'turkey']].fillna("Self") 
+    longform_relationships = longform_relationships.add_prefix("relationship_")
+    all_orders_ever = pd.merge(all_orders_ever, longform_relationships, 
+            left_on=["phase", "country"], right_on=["relationship_phase", "relationship_agent"]).drop(columns=["relationship_phase", "relationship_agent"])
+    
+    alternate_relationship_view = pd.concat(agent_relationship_matrix_over_time)
+    alternate_relationship_view.index.names = ["phase", "agent"]
+    alternate_relationship_view = alternate_relationship_view.stack().reset_index().rename(columns={"level_2":"recipient",
+            0:"status"}).set_index(["phase", "recipient", 
+            "agent"])["status"].unstack("agent").fillna("Self").add_suffix("s_relationship_rating").reset_index()
+    all_orders_ever = pd.merge(all_orders_ever, alternate_relationship_view, 
+            left_on=["phase", "country"], right_on=["phase", "recipient"]).drop(columns=["recipient"])
+
+
+    # if action was supporting
+    all_orders_ever["supporting_self"] = all_orders_ever["country"]==all_orders_ever["recipient_unit_owner"]
+    all_orders_ever["supporting_an_ally"] = (all_orders_ever["country"] !=all_orders_ever["recipient_unit_owner"]) & (all_orders_ever["recipient_unit_owner"].notnull())
+
+    def countries_aside_from(a_country):
+        return [country for country in all_orders_ever["country"].unique() if country != a_country]
+
+    def check_country(supporters, country):
+        if pd.isnull(supporters):
+            return False
+        for other_countries in countries_aside_from(country):
+            if other_countries in supporters:
+                return True
+        return False
+
+    # helpers
+    all_orders_ever["was_supported"] = all_orders_ever["supported_by"].notnull()
+    all_orders_ever["supported_by_self"] = all_orders_ever.apply(lambda x: x["country"] in x["supported_by"] if pd.notnull(x["supported_by"]) else False, axis=1)
+    all_orders_ever["supported_by_other"] = all_orders_ever.apply(lambda x: check_country(x["supported_by"], x["country"]), axis=1)
+
+    all_orders_ever["destination_unit_was_supported"] = all_orders_ever["destination_unit_supported_by"].notnull()
+
+    # add number of unit orders ever made
+    unit_order_weight = 1 / all_orders_ever.groupby("country").size()
+    all_orders_ever["unit_order_weight"] = all_orders_ever["country"].map(unit_order_weight)
+
+    # Get llm order planning
+    assert os.path.exists(f"{path_to_folder}/llm_responses.csv"), f"LLM responses file not found in {path_to_folder}"
+    all_responses = pd.read_csv(f"{path_to_folder}/llm_responses.csv")
+    order_generations = all_responses[all_responses["response_type"] == "order_generation"]
+    order_reasoning_details = order_generations[["power", "phase", "raw_response", "success"]]
+    
+    extracted_order_reasoning = order_reasoning_details["raw_response"].fillna("").apply(lambda x: pd.Series(re.split("parsable output", x, flags=re.IGNORECASE)))
+
+    order_reasoning_details["reasoning"] = extracted_order_reasoning.loc[:, 0]
+    if len(extracted_order_reasoning.columns) > 1:
+        order_reasoning_details["unformatted_orders"] = extracted_order_reasoning.loc[:, 1:].fillna("").apply(lambda x: "\n".join(x), axis=1)
+    else:
+        order_reasoning_details["unformatted_orders"] = ""
+    order_reasoning_details["reasoning_length"] = order_reasoning_details["reasoning"].str.split(" ").apply(len)
+
+    all_orders_ever = pd.merge(all_orders_ever,
+                            order_reasoning_details.rename(columns={"success":"automated_order_extraction_status"}), 
+                            left_on=["country", "phase"], right_on=["power", "phase"], how="left").drop(columns=["power"])
+    return all_orders_ever
+    
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser(description="Create longform order data from diplomacy game logs.")
+    
+    parser.add_argument(
+        "--selected_game", 
+        type=str, 
+        nargs='*', 
+        help="One or more specific games to process. If not provided, all games in the data folder will be processed."
+    )
+    parser.add_argument(
+        "--game_data_folder", 
+        type=str, 
+        default=game_data_folder, 
+        help=f"The folder where game data is stored. Defaults to {game_data_folder}"
+    )
+    parser.add_argument(
+        "--output_folder", 
+        type=str, 
+        default=f"{ai_diplomacy}/Game Data - Analysis/orders-06.29.25", 
+        help="The folder to save the output CSV files."
+    )
+
+    args = parser.parse_args()
+
+    current_game_data_folder = args.game_data_folder
+    output_folder = args.output_folder
+
+    if not os.path.exists(output_folder):
+        print(f"Output folder {output_folder} not found, creating it.")
+        os.makedirs(output_folder)
+
+    games_to_process = args.selected_game
+    if not games_to_process:
+        games_to_process = os.listdir(current_game_data_folder)
+
+    for game_name in games_to_process:
+        if game_name == ".DS_Store":
+            continue
+        
+        game_path = os.path.join(current_game_data_folder, game_name)
+        if not os.path.isdir(game_path):
+            continue
+
+        print(f"Processing {game_name}...")
+        try:
+            data = make_longform_order_data(current_game_data_folder, game_name)
+            output_path = os.path.join(output_folder, f"{game_name}_orders_data.csv")
+            data.to_csv(output_path, index=False)
+            print(f"Successfully saved data for {game_name} to {output_path}")
+        except FileNotFoundError as e:
+            print(f"Could not process {game_name}. Missing file: {e.filename}")
+        except Exception as e:
+            print(f"An unexpected error occurred while processing {game_name}: {e}")
+
+    print("Processing complete.")