init-commit

2026-04-24 17:05:00 +00:00 · 2025-05-23 15:27:15 +08:00 · 2025-05-23 15:27:15 +08:00 · 18a552597a
commit 18a552597a
3461 changed files with 1150579 additions and 0 deletions
--- a/internbootcamp/bootcamp/sudoku/sudoku.py
+++ b/internbootcamp/bootcamp/sudoku/sudoku.py
@ -0,0 +1,374 @@
+"""# 谜题训练场开发任务
+
+## 任务概述
+你是一位资深程序员，我需要你帮我实现一个特定谜题的训练场环境类。这个类继承自`Basebootcamp`，用于生成谜题实例并验证解答。
+
+## 背景说明
+我正在开发一系列谜题训练场，每个训练场对应一个特定类型的谜题。训练场类命名为`{PuzzleName}bootcamp`，其中`PuzzleName`是谜题的名称。
+
+每个训练场类主要提供两个核心功能：
+1. 生成该谜题类型的问题实例
+2. 验证用户对问题的回答是否正确
+
+## 技术接口规范
+
+### 类方法实现要求
+
+```python
+class {PuzzleName}bootcamp(Basebootcamp):
+    def __init__(self, **params):
+        \"\"\"
+        请你自定义params，以保存该puzzle相关的参数，例如网格大小等，参数配有默认值
+        \"\"\"
+        pass
+    
+    def case_generator(self):
+        \"\"\"
+        生成谜题实例，提示：为保证谜题有解，可以先生成结果再对结果处理得到谜题
+        返回：一个可JSON序列化的字典（避免包含set等无法通过json.dumps处理的数据结构）
+        \"\"\"
+        pass
+    
+    @staticmethod
+    def prompt_func(question_case) -> str:
+        \"\"\"
+        将case_generator生成的谜题实例转换为文本形式的问题，问题中包含问题背景、对谜题规则的介绍、具体要解决的谜题实例、期望最终答案的格式，
+        例如：你是xxxx，请你解答yyyy，规则如下：yyyy，最终答案放置在：zzzzz
+
+        参数:
+            question_case: 由case_generator生成的谜题实例
+            
+        返回:
+            str: 格式化的问题字符串
+            
+        注意:
+            1. 需考虑问题的格式，以便后续能正确提取
+            2. 问题描述中应包含期望的答案格式说明，以便后续能正确提取，为了避免抽取时匹配出干扰项，请要求模型将答案放在特定标签，如[answer] [/answer]内
+        \"\"\"
+        pass
+    
+    @staticmethod
+    def extract_output(output):
+        \"\"\"
+        从LLM的回复中提取符合格式要求的答案，如有多个，请抽取最后一个，避免使用re.search等只抽取第一个结果的方式。
+        
+        参数:
+            output: LLM的完整输出（包含原始问题和回答）
+            
+        返回:
+            提取的答案，若未找到符合格式的答案则返回None
+        \"\"\"
+        pass
+    
+    @classmethod
+    def _verify_correction(cls, solution, identity):
+        \"\"\"
+        验证提取的答案是否正确，注意一个问题可以能有多个解，按照谜题规则进行检验，不要直接匹配可能的答案。
+        
+        参数:
+            solution: extract_output提取的答案
+            identity: case_generator生成的谜题实例
+            
+        返回:
+            bool: 答案是否正确
+        \"\"\"
+        pass
+```
+
+### 验证评分方法（基类已实现）
+
+```python
+@classmethod
+def verify_score(cls, model_output, identity:dict, format_score=0.1) -> float:
+    \"\"\"
+    验证输出结果并评分。
+    
+    参数:
+        model_output: 模型的完整输出
+        identity: 谜题实例（由case_generator生成）
+        format_score: 答案格式正确时的基础分数
+    
+    返回:
+        float: 评分结果（0-1之间）
+    \"\"\"
+    score = 0. 
+    try:
+        extract_solution = cls.extract_output(model_output)
+        if extract_solution is None:
+            return score
+        else:
+            score = format_score # 格式正确时的基础分数
+        if cls._verify_correction(extract_solution, identity):
+            score = 1.  # 答案完全正确时的满分
+    except Exception as e:
+        # 处理异常情况
+        pass
+    return score
+```
+
+### 使用示例
+
+```python
+# 初始化谜题训练场
+bootcamp = Puzzlebootcamp()
+
+# 生成谜题实例
+case = bootcamp.case_generator()
+
+# 将谜题转换为文本问题
+prompt = Puzzlebootcamp.prompt_func(case)
+
+# 获取LLM对问题的解答
+response = get_response(prompt, \"LLM\")
+
+# 从完整对话中提取答案
+extracted_output = Puzzlebootcamp.extract_output(prompt + response)
+
+# 验证答案并评分
+score = Puzzlebootcamp.verify_score(extracted_output, case)
+```
+
+## 你的任务
+请根据以下谜题描述（谜题描述可能不完整，请先结合你的知识澄清规则），实现一个完整的谜题训练场类：
+
+### 谜题描述
+
+Sudoku is a logic-based number placement puzzle played on a square grid divided into smaller subgrids (called \"regions\" or \"blocks\"). The rules are as follows:
+
+1. **Grid Structure**:  
+   - The puzzle grid is a square of size N×N, where N is a perfect square (e.g., 9×9, 16×16).  
+   - The grid is subdivided into N smaller rectangular regions, each of size √N×√N. For example, a 9×9 grid has nine 3×3 regions.
+
+2. **Number Placement**:  
+   - The grid is partially filled with numbers (or symbols) at the start.  
+   - The solver must fill every empty cell with a number from **1 to N** (or symbols equivalent in count to N).
+
+3. **Core Rules**:  
+   - **Row Constraint**: Each number must appear **exactly once** in every row.  
+   - **Column Constraint**: Each number must appear **exactly once** in every column.  
+   - **Region Constraint**: Each number must appear **exactly once** in every subgrid/region.  
+
+The puzzle is solved when all cells are filled while satisfying all three constraints. No arithmetic or guessing is required—only logical deduction.
+
+
+请完成上述谜题的训练场环境类实现，包括所有必要的方法。
+"""
+
+from bootcamp import Basebootcamp
+import math
+import random
+from typing import List, Optional
+
+class Sudokubootcamp(Basebootcamp):
+    def __init__(self, size: int = 9):
+        """
+        初始化数独训练场参数
+        
+        参数:
+            size: 数独尺寸（必须为完全平方数，默认9）
+        """
+        sqrt_n = math.isqrt(size)
+        if sqrt_n * sqrt_n != size:
+            raise ValueError("Size必须为完全平方数")
+        self.size = size
+        self.sqrt_n = sqrt_n
+    
+    def case_generator(self) -> dict:
+        """
+        生成数独谜题实例
+        
+        返回包含以下信息的字典:
+        - puzzle: 数独初始网格（0表示空格）
+        - size: 数独尺寸
+        - region_rows: 子区域行数
+        - region_cols: 子区域列数（同region_rows）
+        """
+        # 生成完整解
+        solution = self._generate_full_sudoku()
+        
+        # 挖空50%的格子（可根据需求调整比例）
+        puzzle = self._dig_holes(solution.copy(), dig_prob=0.5)
+        
+        return {
+            "puzzle": [row.copy() for row in puzzle],
+            "size": self.size,
+            "region_rows": self.sqrt_n,
+            "region_cols": self.sqrt_n
+        }
+
+    @staticmethod
+    def prompt_func(question_case: dict) -> str:
+        """
+        将数独实例转换为自然语言描述的问题
+        
+        参数:
+            question_case: case_generator生成的谜题实例
+            
+        返回:
+            包含规则说明和当前谜题状态的格式化字符串
+        """
+        puzzle = question_case["puzzle"]
+        size = question_case["size"]
+        region_size = question_case["region_rows"]
+        
+        prompt = f"""你是一个专业数独玩家，请解决以下{size}x{size}的数独谜题。规则要求：
+1. 每行必须包含1-{size}所有数字，无重复
+2. 每列必须包含1-{size}所有数字，无重复
+3. 每个{region_size}x{region_size}的子区域必须包含1-{size}所有数字，无重复
+
+当前谜题状态（0表示空格）：
+"""
+        for i, row in enumerate(puzzle):
+            prompt += f"第{i+1}行：" + " ".join(str(n) if n != 0 else "▢" for n in row) + "\n"
+
+        prompt += "\n请将完整解答按如下格式放在[answer]标记之间：\n[answer]\n1 2 3 ...\n4 5 6 ...\n...\n[/answer]"
+        return prompt
+
+    @staticmethod
+    def extract_output(output: str) -> Optional[List[List[int]]]:
+        """
+        从模型输出中提取最后一个数独解
+        
+        参数:
+            output: 包含[answer]标记的完整输出文本
+            
+        返回:
+            二维整数矩阵，解析失败时返回None
+        """
+        import re
+        matches = re.findall(r'\[answer\](.*?)\[/answer\]', output, re.DOTALL)
+        if not matches:
+            return None
+            
+        try:
+            solution = []
+            for line in matches[-1].strip().split('\n'):
+                nums = list(map(int, line.strip().split()))
+                if nums:
+                    solution.append(nums)
+            return solution
+        except:
+            return None
+
+    @classmethod
+    def _verify_correction(cls, solution: List[List[int]], identity: dict) -> bool:
+        """
+        验证解的正确性
+        
+        参数:
+            solution: 用户提交的解
+            identity: 谜题实例信息
+            
+        返回:
+            布尔值表示解的正确性
+        """
+        def is_valid_region(grid, row_start, col_start, size, region_size) -> bool:
+            """验证子区域有效性"""
+            nums = set()
+            for i in range(row_start, row_start+region_size):
+                for j in range(col_start, col_start+region_size):
+                    num = grid[i][j]
+                    if num < 1 or num > size or num in nums:
+                        return False
+                    nums.add(num)
+            return True
+
+        puzzle = identity["puzzle"]
+        size = identity["size"]
+        region_size = identity["region_rows"]
+        
+        # 基本维度检查
+        if len(solution) != size or any(len(row) != size for row in solution):
+            return False
+        
+        # 验证初始条件
+        for i in range(size):
+            for j in range(size):
+                if puzzle[i][j] != 0 and solution[i][j] != puzzle[i][j]:
+                    return False
+        
+        # 验证行、列、子区域
+        valid_range = set(range(1, size+1))
+        for i in range(size):
+            if set(solution[i]) != valid_range:  # 行验证
+                return False
+            if set(solution[j][i] for j in range(size)) != valid_range:  # 列验证
+                return False
+            
+        # 子区域验证
+        for i in range(0, size, region_size):
+            for j in range(0, size, region_size):
+                if not is_valid_region(solution, i, j, size, region_size):
+                    return False
+        
+        return True
+
+    def _generate_full_sudoku(self) -> List[List[int]]:
+        """生成有效完整数独的核心算法"""
+        size = self.size
+        region_size = self.sqrt_n
+        grid = [[0]*size for _ in range(size)]
+        
+        # 填充对角线子区域
+        for i in range(0, size, region_size):
+            nums = list(range(1, size+1))
+            random.shuffle(nums)
+            for x in range(region_size):
+                for y in range(region_size):
+                    grid[i+x][i+y] = nums[x*region_size + y]
+        
+        # 解数独
+        self._solve_sudoku(grid)
+        return grid
+
+    def _solve_sudoku(self, grid: List[List[int]]) -> bool:
+        """回溯法解数独"""
+        size = self.size
+        region_size = self.sqrt_n
+        empty = self._find_empty(grid)
+        
+        if not empty:
+            return True
+            
+        row, col = empty
+        for num in random.sample(range(1, size+1), size):  # 随机尝试增加多样性
+            if self._is_safe(grid, row, col, num):
+                grid[row][col] = num
+                if self._solve_sudoku(grid):
+                    return True
+                grid[row][col] = 0
+        return False
+
+    def _find_empty(self, grid: List[List[int]]) -> Optional[tuple]:
+        """寻找下一个空单元格"""
+        for i in range(self.size):
+            for j in range(self.size):
+                if grid[i][j] == 0:
+                    return (i, j)
+        return None
+
+    def _is_safe(self, grid: List[List[int]], row: int, col: int, num: int) -> bool:
+        """检查数字是否可以安全填入"""
+        size = self.size
+        region_size = self.sqrt_n
+        
+        # 检查行和列
+        if num in grid[row] or num in [grid[i][col] for i in range(size)]:
+            return False
+            
+        # 检查子区域
+        start_row, start_col = row - row%region_size, col - col%region_size
+        for i in range(region_size):
+            for j in range(region_size):
+                if grid[start_row+i][start_col+j] == num:
+                    return False
+        return True
+
+    def _dig_holes(self, grid: List[List[int]], dig_prob: float) -> List[List[int]]:
+        """挖洞生成谜题（保证至少有一个解）"""
+        size = self.size
+        for i in range(size):
+            for j in range(size):
+                if random.random() < dig_prob:
+                    grid[i][j] = 0
+        return grid