init-commit

2026-04-19 12:58:04 +00:00 · 2025-05-23 15:27:15 +08:00 · 2025-05-23 15:27:15 +08:00 · 18a552597a
commit 18a552597a
3461 changed files with 1150579 additions and 0 deletions
--- a/internbootcamp/bootcamp/kor_operation_unicode203b/kor_operation_unicode203b.py
+++ b/internbootcamp/bootcamp/kor_operation_unicode203b/kor_operation_unicode203b.py
@ -0,0 +1,449 @@
+"""# 谜题训练场开发任务
+
+## 任务概述
+你是一位资深程序员，我需要你帮我实现一个特定谜题的训练场环境类。这个类继承自`Basebootcamp`，用于生成谜题实例并验证解答。
+
+## 背景说明
+我正在开发一系列谜题训练场，每个训练场对应一个特定类型的谜题。训练场类命名为`{PuzzleName}bootcamp`，其中`PuzzleName`是谜题的名称。
+
+每个训练场类主要提供两个核心功能：
+1. 生成该谜题类型的问题实例
+2. 验证用户对问题的回答是否正确
+
+## 技术接口规范
+
+### 类方法实现要求
+
+```python
+from bootcamp import Basebootcamp
+
+class {PuzzleName}bootcamp(Basebootcamp):
+    def __init__(self, **params):
+        \"\"\"
+        请你自定义params，以保存该puzzle相关的参数，例如网格大小等，参数配有默认值
+        \"\"\"
+        pass
+    
+    def case_generator(self):
+        \"\"\"
+        生成谜题实例，提示：为保证谜题有解，可以先生成结果再对结果处理得到谜题
+        返回：一个可JSON序列化的字典（避免包含set等无法通过json.dumps处理的数据结构）
+        \"\"\"
+        pass
+    
+    @staticmethod
+    def prompt_func(question_case) -> str:
+        \"\"\"
+        将case_generator生成的谜题实例转换为文本形式的问题，问题中包含问题背景、对谜题规则的介绍、具体要解决的谜题实例、期望最终答案的格式，
+        例如：你是xxxx，请你解答yyyy，规则如下：yyyy，最终答案放置在：zzzzz
+        注意：请参照提供的谜题描述进行复述，规则应当描述详细，包括任务背景、具体任务操作规则、对题目格式和答案格式的含义介绍等，
+
+        参数:
+            question_case: 由case_generator生成的谜题实例
+            
+        返回:
+            str: 格式化的问题字符串
+            
+        注意:
+            1. 需考虑问题的格式，以便后续能正确提取
+            2. 问题描述中应包含期望的答案格式说明，以便后续能正确提取，为了避免抽取时匹配出干扰项，请要求模型将答案放在特定标签（如双括号）内，例如[[your answer here]]
+        \"\"\"
+        pass
+    
+    @staticmethod
+    def extract_output(output):
+        \"\"\"
+        从LLM的回复中提取符合格式要求的答案，如有多个，请抽取最后一个，避免使用re.search等只抽取第一个结果的方式。
+        
+        参数:
+            output: LLM的完整输出（包含原始问题和回答）
+            
+        返回:
+            提取的答案，若未找到符合格式的答案则返回None
+        \"\"\"
+        pass
+    
+    @classmethod
+    def _verify_correction(cls, solution, identity):
+        \"\"\"
+        验证提取的答案是否正确，注意一个问题可以能有多个解，按照谜题规则进行检验，不要直接匹配可能的答案。
+        
+        参数:
+            solution: extract_output提取的答案
+            identity: case_generator生成的谜题实例
+            
+        返回:
+            bool: 答案是否正确
+        \"\"\"
+        pass
+```
+
+### 验证评分方法（基类已实现）
+
+```python
+@classmethod
+def verify_score(cls, model_output, identity:dict, format_score=0.1) -> float:
+    \"\"\"
+    验证输出结果并评分。
+    
+    参数:
+        model_output: 模型的完整输出
+        identity: 谜题实例（由case_generator生成）
+        format_score: 答案格式正确时的基础分数
+    
+    返回:
+        float: 评分结果（0-1之间）
+    \"\"\"
+    score = 0. 
+    try:
+        extract_solution = cls.extract_output(model_output)
+        if extract_solution is None:
+            return score
+        else:
+            score = format_score # 格式正确时的基础分数
+        if cls._verify_correction(extract_solution, identity):
+            score = 1.  # 答案完全正确时的满分
+    except Exception as e:
+        # 处理异常情况
+        pass
+    return score
+```
+
+### 使用示例
+
+```python
+# 初始化谜题训练场
+bootcamp = Puzzlebootcamp()
+
+# 生成谜题实例
+case = bootcamp.case_generator()
+
+# 将谜题转换为文本问题
+prompt = Puzzlebootcamp.prompt_func(case)
+
+# 获取LLM对问题的解答
+response = get_response(prompt, \"LLM\")
+
+# 从完整对话中提取答案
+extracted_output = Puzzlebootcamp.extract_output(prompt + response)
+
+# 验证答案并评分
+score = Puzzlebootcamp.verify_score(extracted_output, case)
+```
+
+## 你的任务
+请根据以下谜题描述（谜题描述可能不完整，请先结合你的知识澄清规则），实现一个完整的谜题训练场类：
+
+### 谜题描述
+Define an operation such that when a is a multiple of b, a※b = a/b + 2.
+When b is a multiple of a, a※b = b/a + 2.
+If a is not a multiple of b and b is not a multiple of a, a※b = 24.
+Both a and b are integers.Example questions are as follows:
+
+<example 0>
+Compute 4※7.
+Please ensure the answer is a single number and wrap it in double square brackets, like this: [[your answer]].
+</example 0>
+
+<example 1>
+Compute 25※5※14.
+Please ensure the answer is a single number and wrap it in double square brackets, like this: [[your answer]].
+</example 1>
+
+<example 2>
+Compute 19※28※31※(286※13).
+Please ensure the answer is a single number and wrap it in double square brackets, like this: [[your answer]].
+</example 2>
+
+<example 3>
+Compute 19※28※4※(104※13).
+Please ensure the answer is a single number and wrap it in double square brackets, like this: [[your answer]].
+</example 3>
+
+<example 4>
+If X※14=5, find X.
+Please ensure the answer is a single number and wrap it in double square brackets, like this: [[your answer]].
+</example 4>
+
+<example 5>
+If 25※X※14=4, find X.
+When providing your answer, please enclose it in double square brackets, like this: [[answer]]. 
+If there is more than one correct answer, separate the answers with 'or', like this: [[1or2]].
+</example 5>
+
+<example 6>
+If 25※5※X=4, find X.
+When providing your answer, please enclose it in double square brackets, like this: [[answer]]. 
+If there is more than one correct answer, separate the answers with 'or', like this: [[1or2]].
+</example 6>
+
+<example 7>
+If 19※28※4※(X※13) =3, find X.
+When providing your answer, please enclose it in double square brackets, like this: [[answer]]. 
+If there is more than one correct answer, separate the answers with 'or', like this: [[1or2]].
+</example 7>
+
+<example 8>
+Now we make a little change to the rule: when a is a multiple of b, a ※ b = a / b + C; when b is a multiple of a, a ※ b = b / a + C; if a is not a multiple of b, b is not a multiple of a, a ※ b = 24, where C is a parameter.
+Given that: 25 ※ 5 = 8, find C.
+The answer should only be given as a number.
+Please wrap the answer in double square brackets, like this: [[your answer]].
+</example 8>
+
+<example 9>
+Now we make a little change to the rule: when a is a multiple of b, a ※ b = a / b + C; when b is a multiple of a, a ※ b = b / a + C; if a is not a multiple of b, b is not a multiple of a, a ※ b = 24, where C is a parameter.
+Given that: 14※42=4,find C.
+The answer should only be given as a number.
+Please wrap the answer in double square brackets, like this: [[your answer]].
+</example 9>
+
+
+请完成上述谜题的训练场环境类实现，包括所有必要的方法。
+"""
+
+from bootcamp import Basebootcamp
+import json
+import random
+import re
+from bootcamp import Basebootcamp
+
+class KorOperationUnicode203bbootcamp(Basebootcamp):
+    def __init__(self, C=2, max_operand=100, max_attempts=100, **params):
+        super().__init__(**params)
+        self.C = C
+        self.max_operand = max_operand
+        self.max_attempts = max_attempts
+
+    def case_generator(self):
+        problem_type = random.choices(
+            ['compute', 'solve_x', 'solve_c'],
+            weights=[5, 3, 2],
+            k=1
+        )[0]
+        
+        try:
+            if problem_type == 'compute':
+                return self._generate_compute_case()
+            elif problem_type == 'solve_x':
+                return self._generate_solve_x_case()
+            elif problem_type == 'solve_c':
+                return self._generate_solve_c_case()
+        except Exception as e:
+            # 异常时返回默认计算题
+            return self._generate_compute_case()
+
+    def _generate_compute_case(self):
+        for _ in range(self.max_attempts):
+            num_operands = random.choices([2,3,4], weights=[5,3,1])[0]
+            operands = [random.randint(1, self.max_operand) for _ in range(num_operands)]
+            
+            try:
+                current_value = operands[0]
+                for op in operands[1:]:
+                    current_value = self._compute_operation(current_value, op, self.C)
+            except ZeroDivisionError:
+                continue
+            
+            # 允许有限概率生成结果为24的题目
+            if current_value !=24 or random.random() < 0.2:
+                return {
+                    'type': 'compute',
+                    'expression': operands,
+                    'C': self.C,
+                    'answer': int(current_value)
+                }
+        
+        # 保底返回简单计算题
+        return {
+            'type': 'compute',
+            'expression': [4,7],
+            'C': self.C,
+            'answer': 24
+        }
+
+    def _compute_operation(self, a, b, C):
+        if b == 0 or a == 0:
+            return 24
+        if a % b == 0:
+            return (a // b) + C
+        if b % a == 0:
+            return (b // a) + C
+        return 24
+
+    def _generate_solve_x_case(self):
+        for _ in range(self.max_attempts):
+            # 随机选择生成方向
+            if random.random() < 0.5:  # 生成 a※X=...
+                a = random.randint(2, self.max_operand)
+                delta = random.randint(1, 5)
+                target = self.C + delta
+                solutions = []
+                
+                # 寻找所有可能的X解
+                for X in range(1, self.max_operand*2):
+                    try:
+                        if self._compute_operation(a, X, self.C) == target:
+                            solutions.append(X)
+                    except:
+                        continue
+                
+                if solutions:
+                    return {
+                        'type': 'solve_x',
+                        'equation': f"{a}※X={target}",
+                        'solutions': solutions,
+                        'C': self.C
+                    }
+            else:  # 生成 X※a=...
+                a = random.randint(2, self.max_operand)
+                delta = random.randint(1, 5)
+                target = self.C + delta
+                solutions = []
+                
+                for X in range(1, self.max_operand*2):
+                    try:
+                        if self._compute_operation(X, a, self.C) == target:
+                            solutions.append(X)
+                    except:
+                        continue
+                
+                if solutions:
+                    return {
+                        'type': 'solve_x',
+                        'equation': f"X※{a}={target}",
+                        'solutions': solutions,
+                        'C': self.C
+                    }
+        
+        # 保底返回单解问题
+        return {
+            'type': 'solve_x',
+            'equation': "X※4=6",
+            'solutions': [8],  # 8※4=2+2=4?
+            'C': self.C
+        }
+
+    def _generate_solve_c_case(self):
+        for _ in range(self.max_attempts):
+            # 随机生成方向
+            if random.random() < 0.5:
+                a = random.randint(1, self.max_operand)
+                factor = random.randint(2, 5)
+                b = a * factor
+                expected = factor + self.C  # a※b = b/a + C
+            else:
+                b = random.randint(1, self.max_operand)
+                factor = random.randint(2, 5)
+                a = b * factor
+                expected = factor + self.C  # a※b = a/b + C
+            
+            # 避免除零错误
+            if a == 0 or b == 0:
+                continue
+            
+            return {
+                'type': 'solve_c',
+                'equation': f"{a}※{b}={expected}",
+                'answer': self.C
+            }
+        
+        # 保底返回
+        return {
+            'type': 'solve_c',
+            'equation': "25※5=8",
+            'answer': 3  # 25/5=5 +3=8
+        }
+
+    @staticmethod
+    def prompt_func(question_case):
+        # 统一规则描述
+        if 'C' in question_case and question_case['C'] != 2:
+            rule_desc = [
+                "We define a special operation ※ with parameter C:",
+                "- If a is a multiple of b: a ※ b = a/b + C",
+                "- If b is a multiple of a: a ※ b = b/a + C",
+                "- Otherwise: a ※ b = 24"
+            ]
+        else:
+            rule_desc = [
+                "We define a special operation ※ with these rules:",
+                "- When a is a multiple of b: a ※ b = a/b + 2",
+                "- When b is a multiple of a: a ※ b = b/a + 2",
+                "- If neither is a multiple: a ※ b = 24"
+            ]
+        
+        task_desc = ""
+        if question_case['type'] == 'compute':
+            expr = '※'.join(map(str, question_case['expression']))
+            task_desc = f"Compute the value of {expr}."
+            format_note = "Put your final answer in [[ ]] as a single number."
+        elif question_case['type'] == 'solve_x':
+            task_desc = f"Solve the equation: {question_case['equation']}"
+            if len(question_case['solutions']) > 1:
+                format_note = "Put all possible solutions in [[ ]] separated by 'or', e.g., [[2or5]]."
+            else:
+                format_note = "Put your answer in [[ ]] as a single number."
+        elif question_case['type'] == 'solve_c':
+            task_desc = f"Determine parameter C from equation: {question_case['equation']}"
+            format_note = "Put your answer in [[ ]] as a single number."
+        
+        return (
+            '\n'.join(rule_desc) + '\n\n' +
+            f'Problem: {task_desc}\n' +
+            f'Format Requirement: {format_note}'
+        )
+
+    @staticmethod
+    def extract_output(output):
+        matches = re.findall(r'\[\[(.*?)\]\]', output)
+        if not matches:
+            return None
+        last_match = matches[-1].strip()
+        # 清理多余内容
+        cleaned = re.sub(r'[^0-9or]', '', last_match.lower())
+        return cleaned if cleaned else None
+
+    @classmethod
+    def _verify_correction(cls, solution, identity):
+        if solution is None:
+            return False
+        
+        try:
+            if identity['type'] == 'compute':
+                return int(solution) == identity['answer']
+            
+            elif identity['type'] == 'solve_x':
+                # 处理多格式输入
+                parts = re.split(r'\bor\b|,', solution)
+                answers = set()
+                for p in parts:
+                    p = p.strip()
+                    if p.isdigit():
+                        answers.add(int(p))
+                return answers == set(identity['solutions'])
+            
+            elif identity['type'] == 'solve_c':
+                return int(solution) == identity['answer']
+            
+            return False
+        except Exception as e:
+            return False
+
+# 测试代码
+if __name__ == "__main__":
+    bootcamp = KorOperationUnicode203bbootcamp()
+    for _ in range(3):
+        case = bootcamp.case_generator()
+        print("Generated Case:")
+        print(json.dumps(case, indent=2))
+        
+        prompt = KorOperationUnicode203bbootcamp.prompt_func(case)
+        print("\nPrompt:\n", prompt)
+        
+        # 测试验证逻辑
+        test_solution = "[[7]]" if case['type'] == 'compute' else "[[3or5]]"
+        print("\nTest verification:", bootcamp._verify_correction(
+            KorOperationUnicode203bbootcamp.extract_output(test_solution),
+            case
+        ))
+        print("="*50)