init-commit

2026-04-25 17:10:49 +00:00 · 2025-05-23 15:27:15 +08:00 · 2025-05-23 15:27:15 +08:00 · 18a552597a
commit 18a552597a
3461 changed files with 1150579 additions and 0 deletions
--- a/internbootcamp/bootcamp/calcudoku/calcudoku.py
+++ b/internbootcamp/bootcamp/calcudoku/calcudoku.py
@ -0,0 +1,233 @@
+import re
+import ast
+import json
+import sys
+sys.path.append('./')
+from internbootcamp.bootcamp.base import Basebootcamp
+# from environments import CalcudokuEnvironment
+from internbootcamp.libs.calcudoku.calcudoku_generator import CalcudokuGenerator
+import random
+
+class Calcudokubootcamp(Basebootcamp):
+    
+    def __init__(self, size: int = 6, group_size_range: tuple = (1, 4)):
+        """Store the puzzle configuration that ``case_generator`` uses.
+
+        Args:
+            size: Later forwarded to ``CalcudokuGenerator`` as ``n``.
+            group_size_range: Later forwarded to ``CalcudokuGenerator`` as
+                ``group_size_range``.
+        """
+        super().__init__()
+        self.group_size_range = group_size_range
+        self.size = size
+    
+    def generator(self, size: int = 6, group_size_range: tuple = (1, 4), seed: int = None):
+        """Generate a new puzzle and remember it on the instance.
+
+        Args:
+            size: Forwarded to ``CalcudokuGenerator`` as ``n``.
+            group_size_range: Forwarded to ``CalcudokuGenerator`` unchanged.
+            seed: Forwarded to ``CalcudokuGenerator``; ``None`` by default.
+
+        Returns:
+            The value returned by ``generate_puzzle()``, which is also stored
+            in ``self.grid``.
+        """
+        puzzle_builder = CalcudokuGenerator(
+            n=size,
+            group_size_range=group_size_range,
+            seed=seed,
+        )
+        puzzle = puzzle_builder.generate_puzzle()
+        self.grid = puzzle
+        return puzzle
+
+    def get_question(self):
+        """Render the current puzzle into one of two prompt wordings.
+
+        Both wordings embed ``self.grid`` verbatim; one of them is picked at
+        random on every call.
+
+        Returns:
+            str: The selected prompt text.
+        """
+        # Wording with an instruction preamble and numbered rules.
+        detailed_prompt = f"""You are an intelligent assistant specializing in solving custom puzzle problems. Below is a specific rule defined for a custom puzzle. Your task is to apply this rule accurately to the provided question.
+
+    ### Instructions:
+    
+    1. Thoroughly understand the rule provided. If needed, break down the rule into simpler components or steps.
+    2. Apply the rule carefully to address the question presented.
+    3. Verify your answer to ensure it aligns with the rule and the context of the puzzle.
+    
+### Calcudoko Puzzle Rule:
+
+1.Calcudoko is a sudoku-like game. The game is played on an NxN grid. In each row and column, fill in the numbers from 1 to N. 
+2.As in sudoku, each number can appear only once in each row and column. 
+3.The grid is divided into groups, each of which has a target number and an operator that indicates that the numbers in the group must equal the target number after a specified operation.
+4.The operations :
+    4.Sum: + The numbers in this group must add to the target value.
+    4.Difference: - One of the numbers in this group, minus the rest, must equal the target value (the number to be subtracted from may be any of the cells).
+    4.Product: * The numbers in this group must multiply to produce the target value.
+    4.Ratio: / One of the numbers in this group, divided by all of the others, must equal the target value. As in a difference group, which of the cells contains the number to be divided is not specified.
+5.Numbers may be repeated within a group (so long as they're not also repeated within a row or column).  
+6.Puzzles are parsed in a "puzzle spec" format, where rows are given one per line, with cells separated by spaces. Groups are labelled with alphabetic characters, which are then used to identify cell membership. 
+
+### Question
+
+Now the "puzzle spec" of a Calcudoko is: 
+{self.grid} 
+
+The answer needs to provide the corresponding numbers for all positions in the Calcudoko.
+"""
+        # Shorter wording that states only the rules.
+        concise_prompt = f"""
+Calcudoko is a sudoku-like game. The game is played on an NxN grid. In each row and column, fill in the numbers from 1 to N. 
+As in sudoku, each number can appear only once in each row and column. 
+The grid is divided into groups, each of which has a target number and an operator that indicates that the numbers in the group must equal the target number after a specified operation.
+Sum: +
+The numbers in this group must add to the target value.
+Difference: -
+One of the numbers in this group, minus the rest, must equal the target value (the number to be subtracted from may be any of the cells).
+Product: *
+The numbers in this group must multiply to produce the target value.
+Ratio: /
+One of the numbers in this group, divided by all of the others, must equal the target value. As in a difference group, which of the cells contains the number to be divided is not specified.
+
+Numbers may be repeated within a group (so long as they're not also repeated within a row or column).  
+Puzzles are parsed in a "puzzle spec" format, where rows are given one per line, with cells separated by spaces. Groups are labelled with alphabetic characters, which are then used to identify cell membership. 
+
+Now the "puzzle spec" of a Calcudoko is: 
+{self.grid} 
+
+The answer needs to provide the corresponding numbers for all positions in the Calcudoko.
+"""
+        statements = [detailed_prompt, concise_prompt]
+        chosen_index = random.randint(0, len(statements) - 1)
+        return statements[chosen_index]
+
+    def case_generator(self):
+        """Create a new puzzle case from the configured size and group range.
+
+        Side effects: refreshes ``self.grid`` (through ``generator``) and
+        ``self.prompt``.
+
+        Returns:
+            The result of ``parse_question`` applied to the new prompt.
+        """
+        # Called only for its side effect of updating ``self.grid``.
+        self.generator(self.size, self.group_size_range)
+        question = self.get_question()
+        self.prompt = question
+        return self.parse_question(question)
+
+    def prompt_func(self, identity) -> str:
+        """Return the stored question followed by answer-format instructions.
+
+        Args:
+            identity: Not used; the text comes from ``self.prompt``, which
+                ``case_generator`` sets.
+
+        Returns:
+            str: ``self.prompt`` with the formatting instructions appended.
+        """
+        answer_format = """\nThe output should be given in order from left to right, top to bottom, with each element separated by a space and different lines separated by a comma.
+Ensure that your final answer is wrapped in double square brackets,like this: [[1 3 2,2 1 3,3 2 1]]. Making sure the size of your answer should be same as the size of the Calcudoko."""
+        return self.prompt + answer_format
+
+    @staticmethod
+    def parse_question(question: str) -> dict:
+        """Recover the puzzle structure from a prompt built by ``get_question``.
+
+        The prompt embeds the puzzle spec as a Python list literal of
+        single-quoted strings, one string per row, with cells separated by
+        whitespace. The first character of a cell is its group label. A cell
+        made of one letter, one operator (``+ - * /``) and digits also carries
+        the operator and target of that group; the first such cell seen for a
+        label wins.
+
+        Args:
+            question: Prompt text containing the puzzle spec.
+
+        Returns:
+            ``None`` when no spec is found, when the literal cannot be
+            evaluated, or when some row does not hold as many cells as there
+            are rows. Otherwise a dict with the keys ``'groups'`` (label to
+            ``(op, target)``), ``'grid'`` (rows of group labels) and ``'size'``
+            (number of rows).
+        """
+        # Locate the list literal that holds the puzzle spec.
+        match = re.search(r"\[(?:'[^']*'[,\s]*)*\]", question)
+        if not match:
+            return None
+        try:
+            puzzle_spec = ast.literal_eval(match.group(0))
+        except (ValueError, SyntaxError):
+            # The matched text is not a valid literal (e.g. a stray backslash
+            # escapes a closing quote). Only these errors are swallowed so that
+            # KeyboardInterrupt/SystemExit still propagate.
+            return None
+
+        puzzle_rows = [row.split() for row in puzzle_spec]
+        n = len(puzzle_rows)
+        # The grid must be square.
+        if any(len(row) != n for row in puzzle_rows):
+            return None
+
+        # Compiled once instead of once per cell.
+        cell_pattern = re.compile(r'^[A-Za-z]([+*/-])(\d+)$')
+        groups = {}       # group label -> (operator, target)
+        puzzle_grid = []  # rows of group labels
+        for row in puzzle_rows:
+            grid_row = []
+            for cell in row:
+                group_char = cell[0]
+                grid_row.append(group_char)
+                # Pick up the operator and target when the cell carries them.
+                op_match = cell_pattern.fullmatch(cell)
+                if op_match and group_char not in groups:
+                    groups[group_char] = (op_match.group(1), int(op_match.group(2)))
+            puzzle_grid.append(grid_row)
+
+        return {
+            'groups': groups,
+            'grid': puzzle_grid,
+            'size': n,
+        }
+
+    @staticmethod
+    def extract_output(response):
+        """Extract the answer grid from a model response.
+
+        The answer is expected in the form ``[[1 3 2,2 1 3,3 2 1]]``: rows
+        separated by commas, numbers separated by whitespace. When several
+        double-bracket spans occur, the last one is used.
+
+        Args:
+            response: Model output text.
+
+        Returns:
+            A list of rows, each a list of ints, or ``None`` when ``response``
+            is not a string, contains no double-bracket span, or a token in
+            the chosen span is not an integer.
+        """
+        # A missing or non-text response cannot contain an answer.
+        if not isinstance(response, str):
+            return None
+        # Grab the content of every double-bracket span.
+        matches = re.findall(r'\[\[(.*?)\]\]', response, re.DOTALL)
+        if not matches:
+            return None
+
+        solution = []
+        for row in matches[-1].split(','):
+            # Stripping brackets tolerates per-row brackets, as in [[1 2],[2 1]].
+            tokens = row.strip('[] ').split()
+            try:
+                solution.append([int(token) for token in tokens])
+            except ValueError:
+                return None
+        return solution
+        
+
+    @staticmethod
+    def check_solution(parsed_question: dict, parsed_response: list) -> bool:
+        """Check an answer grid against the puzzle rules.
+
+        Args:
+            parsed_question: Dict with the keys ``'size'``, ``'grid'`` (rows of
+                group labels) and ``'groups'`` (label to ``(op, target)``), as
+                built by ``parse_question``.
+            parsed_response: Answer grid as a list of rows of ints, or
+                ``None``.
+
+        Returns:
+            ``True`` only when the answer has the puzzle's size, every row and
+            column holds each of 1..size exactly once, and every group listed
+            in ``'groups'`` meets its target under its operator. ``False``
+            otherwise, including for a ``None`` answer or an unknown operator.
+        """
+        # A response that could not be extracted is simply wrong.
+        if parsed_response is None:
+            return False
+
+        n = parsed_question['size']
+        grid = parsed_question['grid']
+        groups = parsed_question['groups']
+        solution = parsed_response
+
+        # Shape, then row/column validity.
+        if len(solution) != n or any(len(row) != n for row in solution):
+            return False
+        expected = list(range(1, n + 1))
+        for i in range(n):
+            if sorted(solution[i]) != expected:
+                return False
+            if sorted(row[i] for row in solution) != expected:
+                return False
+
+        # Collect the numbers that fall into each group.
+        group_numbers = {}
+        for grid_row, solution_row in zip(grid, solution):
+            for label, value in zip(grid_row, solution_row):
+                group_numbers.setdefault(label, []).append(value)
+
+        # Verify each group against its operator and target.
+        for label, (op, target) in groups.items():
+            nums = group_numbers.get(label, [])
+            total = sum(nums)
+            product = 1
+            for value in nums:
+                product *= value
+
+            if op == '+':
+                satisfied = total == target
+            elif op == '*':
+                satisfied = product == target
+            elif op == '-':
+                # x - (total - x) == target
+                satisfied = any(2 * x == total + target for x in nums)
+            elif op == '/':
+                # x / (product / x) == target, kept in integers. Dividing out
+                # exactly one occurrence of x stays correct when a value is
+                # repeated inside the group, which the rules allow.
+                satisfied = any(x * x == target * product for x in nums)
+            else:
+                satisfied = False
+
+            if not satisfied:
+                return False
+
+        return True
+
+    @classmethod
+    def _verify_correction(cls, solution, identity):
+        """Judge a solution against a puzzle by delegating to ``check_solution``.
+
+        Args:
+            solution: Passed to ``check_solution`` as ``parsed_response``.
+            identity: Passed to ``check_solution`` as ``parsed_question``.
+
+        Returns:
+            Whatever ``check_solution(identity, solution)`` returns.
+        """
+        # ``check_solution`` takes the puzzle first and the answer second.
+        is_correct = cls.check_solution(identity, solution)
+        return is_correct