init-commit

2026-04-23 16:55:02 +00:00 · 2025-05-23 15:27:15 +08:00 · 2025-05-23 15:27:15 +08:00 · 18a552597a
commit 18a552597a
3461 changed files with 1150579 additions and 0 deletions
--- a/internbootcamp/bootcamp/game24/game_default.py
+++ b/internbootcamp/bootcamp/game24/game_default.py
@ -0,0 +1,191 @@
+import re
+import json
+from internbootcamp.bootcamp.base import Basebootcamp
+from internbootcamp.libs.game24.game24 import Game24Plus
+
+def remove_boxed(s):
+    if "\\boxed " in s:
+        left = "\\boxed "
+        assert s[:len(left)] == left
+        return s[len(left):]
+
+    left = "\\boxed{"
+
+    assert s[:len(left)] == left
+    assert s[-1] == "}"
+
+    return s[len(left):-1]
+
+
+def last_boxed_only_string(string):
+    idx = string.rfind("\\boxed")
+    if "\\boxed " in string:
+        return "\\boxed " + string.split("\\boxed ")[-1].split("$")[0]
+    if idx < 0:
+        idx = string.rfind("\\fbox")
+        if idx < 0:
+            return None
+
+    i = idx
+    right_brace_idx = None
+    num_left_braces_open = 0
+    while i < len(string):
+        if string[i] == "{":
+            num_left_braces_open += 1
+        if string[i] == "}":
+            num_left_braces_open -= 1
+            if num_left_braces_open == 0:
+                right_brace_idx = i
+                break
+        i += 1
+
+    if right_brace_idx is None:
+        retval = None
+    else:
+        retval = string[idx:right_brace_idx + 1]
+
+    return retval
+
+class Game24bootcamp(Basebootcamp):
+    def __init__(self, num_numbers=4, range_max=100, target_max=100, seed = None):
+        # super.__init__()
+        self.num_numbers = num_numbers
+        self.range_max = range_max
+        self.target_max = target_max
+        self.seed = seed
+        self.game24Plus = Game24Plus(num_numbers,range_max,target_max,seed)
+        
+    def case_generator(self) -> object:
+        """
+        生成一组数字和目标值。
+        """
+        # game24Plus = Game24Plus(num_numbers,range_max,target_max,seed)
+        self.numbers = self.game24Plus.get_numbers()
+        self.target, self.operations = self.game24Plus.get_target_limit_range(self.numbers)
+        return {'puzzle': ' '.join(str(i) for i in self.numbers), 'target':self.target}
+    
+    def prompt_func(self, identity) -> str:
+        """
+        Process the input_data and return the processed prompt.
+        
+        Args:
+            question_ori: The question to be processed.
+        
+        Returns:
+            str: The processed prompt.
+        """
+        instruction = f"请解决以下问题：使用数字 {identity['puzzle']} 通过加减乘除得到 {identity['target']}。"
+        instruction_following = """Let's think step by step and output the final answer within \\boxed{}.The final answer should be all input numbers with basic operations, and parentheses can be used to change the order of operations. For example "Final Answer: \\boxed{6+6+(6+6)}"."""
+        
+        prompt = instruction + '\n' + instruction_following
+        return prompt
+    
+    @staticmethod
+    def extract_output(output):
+        """
+        Extract the output from the solution.
+        
+        Args:
+            output: Model output to be processed.
+        
+        Returns:
+            The processed output.
+        """
+        output = last_boxed_only_string(output)
+        if output is None:
+            return None
+        return remove_boxed(output)
+    
+    @staticmethod
+    def _normalize_solution(solution):
+        """
+        Normalize the solution.
+        """
+        solution = solution.replace("**", "")
+        solution = solution.replace("\\times", "*")
+        solution = solution.replace("\\div", "/")
+        solution = solution.replace("\\left", "")
+        solution = solution.replace("\\right", "")
+        return solution
+        
+    @classmethod 
+    def _verify_correction(cls, solution, identity)->bool:
+        """
+        Verify the correction of the solution.
+        """ 
+        puzzle, target = identity['puzzle'], identity['target']
+        current_numbers = puzzle.split()
+        solution = cls._normalize_solution(solution)
+        # 提取所有数字
+        numbers = re.findall(r'\d+', solution)
+        # 提取所有运算符
+        operators = re.findall(r'[+\-*/]', solution)
+        
+        # 检查数字
+        if len(numbers) != len(current_numbers):
+            return False
+        for n in numbers:
+            if n not in current_numbers:
+                return False
+            current_numbers.remove(n)
+        if current_numbers:
+            return False
+        # 检查运算符
+        if '**' in solution or '//' in solution:
+            return False
+        if any(op not in '+-*/' for op in operators):
+            return False
+        
+        try:
+            # 计算结果
+            result = eval(solution)
+            if result != int(target):
+                return False
+        except:
+            return False
+        
+        return True
+        
+        
+
+
+
+if __name__ == '__main__':
+    bootcamp = Game24bootcamp
+    data = [
+        {
+            "puzzle": "6 6 6 6",
+            "target": "24",
+            "solution": "\\boxed{6*6-6/6}",
+        },
+        {
+            "puzzle": "5 9 10 20",
+            "target": "30",
+            "solution": "\\boxed{5*10-9+20}",
+        },
+        {
+            "puzzle": "5 9 10 11",
+            "target": "30",
+            "solution": "\\boxed{5 * 10-9-11}",
+        },
+        {
+            "puzzle": "5 9 10 11",
+            "target": "30",
+            "solution": "\\boxed{5 \\times 10-(9+11)}",
+        },
+        {
+            "puzzle": "5 9 10 11",
+            "target": "30",
+            "solution": "\\boxed{5\\times10-9+11}",
+        },
+        {
+            "puzzle": [0, 1, 3, 4],
+            "target": "7",
+            "solution": "\\boxed{(4 + 3) / (1 + 0)}",
+        },
+
+    ]
+    
+    for d in data:
+        print(bootcamp.verify_score(d['solution'], d, short_threshold=1))
+