init-commit

2026-04-22 16:49:04 +00:00 · 2025-05-23 15:27:15 +08:00 · 2025-05-23 15:27:15 +08:00 · 18a552597a
commit 18a552597a
3461 changed files with 1150579 additions and 0 deletions
--- a/internbootcamp/bootcamp/kor_logic_predicate_logic_formalization/kor_logic_predicate_logic_formalization.py
+++ b/internbootcamp/bootcamp/kor_logic_predicate_logic_formalization/kor_logic_predicate_logic_formalization.py
@ -0,0 +1,527 @@
+"""# 谜题训练场开发任务
+
+## 任务概述
+你是一位资深程序员，我需要你帮我实现一个特定谜题的训练场环境类。这个类继承自`Basebootcamp`，用于生成谜题实例并验证解答。
+
+## 背景说明
+我正在开发一系列谜题训练场，每个训练场对应一个特定类型的谜题。训练场类命名为`{PuzzleName}bootcamp`，其中`PuzzleName`是谜题的名称。
+
+每个训练场类主要提供两个核心功能：
+1. 生成该谜题类型的问题实例
+2. 验证用户对问题的回答是否正确
+
+## 技术接口规范
+
+### 类方法实现要求
+
+```python
+from bootcamp import Basebootcamp
+
+class {PuzzleName}bootcamp(Basebootcamp):
+    def __init__(self, **params):
+        \"\"\"
+        请你自定义params，以保存该puzzle相关的参数，例如网格大小等，参数配有默认值
+        \"\"\"
+        pass
+    
+    def case_generator(self):
+        \"\"\"
+        生成谜题实例，提示：为保证谜题有解，可以先生成结果再对结果处理得到谜题
+        返回：一个可JSON序列化的字典（避免包含set等无法通过json.dumps处理的数据结构）
+        \"\"\"
+        pass
+    
+    @staticmethod
+    def prompt_func(question_case) -> str:
+        \"\"\"
+        将case_generator生成的谜题实例转换为文本形式的问题，问题中包含问题背景、对谜题规则的介绍、具体要解决的谜题实例、期望最终答案的格式，
+        例如：你是xxxx，请你解答yyyy，规则如下：yyyy，最终答案放置在：zzzzz
+        注意：请参照提供的谜题描述进行复述，规则应当描述详细，包括任务背景、具体任务操作规则、对题目格式和答案格式的含义介绍等，
+
+        参数:
+            question_case: 由case_generator生成的谜题实例
+            
+        返回:
+            str: 格式化的问题字符串
+            
+        注意:
+            1. 需考虑问题的格式，以便后续能正确提取
+            2. 问题描述中应包含期望的答案格式说明，以便后续能正确提取，为了避免抽取时匹配出干扰项，请要求模型将答案放在特定标签（如双括号）内，例如[[your answer here]]
+        \"\"\"
+        pass
+    
+    @staticmethod
+    def extract_output(output):
+        \"\"\"
+        从LLM的回复中提取符合格式要求的答案，如有多个，请抽取最后一个，避免使用re.search等只抽取第一个结果的方式。
+        
+        参数:
+            output: LLM的完整输出（包含原始问题和回答）
+            
+        返回:
+            提取的答案，若未找到符合格式的答案则返回None
+        \"\"\"
+        pass
+    
+    @classmethod
+    def _verify_correction(cls, solution, identity):
+        \"\"\"
+        验证提取的答案是否正确，注意一个问题可以能有多个解，按照谜题规则进行检验，不要直接匹配可能的答案。
+        
+        参数:
+            solution: extract_output提取的答案
+            identity: case_generator生成的谜题实例
+            
+        返回:
+            bool: 答案是否正确
+        \"\"\"
+        pass
+```
+
+### 验证评分方法（基类已实现）
+
+```python
+@classmethod
+def verify_score(cls, model_output, identity:dict, format_score=0.1) -> float:
+    \"\"\"
+    验证输出结果并评分。
+    
+    参数:
+        model_output: 模型的完整输出
+        identity: 谜题实例（由case_generator生成）
+        format_score: 答案格式正确时的基础分数
+    
+    返回:
+        float: 评分结果（0-1之间）
+    \"\"\"
+    score = 0. 
+    try:
+        extract_solution = cls.extract_output(model_output)
+        if extract_solution is None:
+            return score
+        else:
+            score = format_score # 格式正确时的基础分数
+        if cls._verify_correction(extract_solution, identity):
+            score = 1.  # 答案完全正确时的满分
+    except Exception as e:
+        # 处理异常情况
+        pass
+    return score
+```
+
+### 使用示例
+
+```python
+# 初始化谜题训练场
+bootcamp = Puzzlebootcamp()
+
+# 生成谜题实例
+case = bootcamp.case_generator()
+
+# 将谜题转换为文本问题
+prompt = Puzzlebootcamp.prompt_func(case)
+
+# 获取LLM对问题的解答
+response = get_response(prompt, \"LLM\")
+
+# 从完整对话中提取答案
+extracted_output = Puzzlebootcamp.extract_output(prompt + response)
+
+# 验证答案并评分
+score = Puzzlebootcamp.verify_score(extracted_output, case)
+```
+
+## 你的任务
+请根据以下谜题描述（谜题描述可能不完整，请先结合你的知识澄清规则），实现一个完整的谜题训练场类：
+
+### 谜题描述
+Universal Quantifier: Use Ax to denote \"for all x\".
+Existential Quantifier: Use Ex to denote \"there exists some x\".
+
+Logical Connectives:
+Conjunction: Use &
+Disjunction: Use |
+Implication: Use ⇒
+Negation: Use ∼
+
+In general, a predicate P with n (n > 1) individual variables is called an n-ary predicate, denoted as P(x1, x2, ..., xn). When n = 1, P(x) denotes the property P; when n ≥ 2, P(x1, x2, ..., xn) denotes the relationship P among x1, x2, ..., xn.
+
+Predicates without individual variables are called 0-ary predicates. For example, F(a), G(a, b), P(a1, ..., an) are all 0-ary predicates.
+
+Let D be the domain of individuals.
+\"All x in D have property F\" is symbolized as AxF(x).
+\"Some x in D have property F\" is symbolized as ExF(x).
+\"For all x in D, if x has property F, then x has property G\" is symbolized as Ax(F(x) ⇒ G(x)).
+\"Some x in D have both properties F and G\" is symbolized as Ex(F(x) & G(x)).
+\"For all x, y in D, if x has property F and y has property G, then x and y have relationship H\" is symbolized as AxAy(F(x) & F(y) ⇒ H(x, y)).
+\"For all x in D, if x has property F, then there exists some y with property G such that x and y have relationship H\" is symbolized as Ax(F(x) ⇒ Ey(G(y) & H(x, y))).
+\"There exists some x in D with property F, and for all y in D, if y has property G, then x and y have relationship H\" is symbolized as Ex(F(x) & Ay(G(y) ⇒ H(x, y))).Example questions are as follows:
+
+<example 0>
+In first-order logic, symbolize the following propositions using 0-ary predicates:
+(1) Only 2 is a prime number, 4 is a composite number.
+(2) If 5 is greater than 4, then 4 is greater than 6.
+
+For (1), define a unary predicate F(x): x is a prime number. 
+The proposition can be symbolized as?
+
+For (2), define a binary predicate G(x, y): x > y. 
+The proposition can be symbolized as?
+
+Please provide the answers in the format [[];[]].
+</example 0>
+
+<example 1>
+In individual domains limited to (a) and (b) conditions, symbolize the following two propositions:
+(1) All humans breathe.
+(2) Some people write with their left hand.
+Where:
+(a) Individual domain D1 is the set of humans.
+(b) Individual domain D2 is the universal domain.
+
+(a) 
+Let F(x): x breathes.
+G(x): x writes with their left hand.
+In D1, apart from humans, there is nothing else,
+thus (1) symbolizes as? (2) symbolizes as?
+
+(b) 
+In D2, besides humans, there are all things, 
+so when symbolizing, humans must be separated first. 
+Introduce predicate M(x): x is a human. 
+In D2, clarify (1) and (2) as follows:
+(1) For all individuals in the universe, if the individual is human, then they breathe.
+(2) There exists an individual in the universe who writes with their left hand (or more precisely, there exists such an individual who is human and writes with their left hand).
+
+Therefore, (1) symbolizes as?(2) symbolizes as?
+
+Please provide the answers in the format [[];[];[];[]].
+</example 1>
+
+<example 2>
+Symbolize the following propositions:
+(1) All humans have black hair.
+(2) Some people have been to the moon.
+(3) No one has been to Jupiter.
+(4) Students studying in the United States are not necessarily Asian.
+
+Using the universal domain.
+Let M(x): x is a human,
+(1) Let F(x): x has black hair. Proposition (1) symbolizes as?
+(2) Let G(x): x has been to the moon. Proposition (2) symbolizes as?
+(3) Let H(x): x has been to Jupiter. Proposition (3) symbolizes as?
+(4) Let F(x): x studies in the United States, G(x): x is Asian. Proposition (4) symbolizes as?
+
+Please provide the answers in the format [[];[];[];[]].
+</example 2>
+
+<example 3>
+Using the universal domain, symbolize the proposition:
+Some rabbits run faster than all turtles.
+
+Let F(x): x is a rabbit,
+G(y): y is a turtle,
+H(x,y): x runs faster than y,
+L(x,y): x runs equally fast as y.
+
+Thus, this proposition can be symbolized as?
+
+Please provide the answer in the format [[]].
+</example 3>
+
+<example 4>
+Given the domain of individuals as the set of natural numbers(N),
+F(x): x is even,
+G(x): x is prime,
+
+Using 0-ary predicates, symbolize the following propositions:
+(1) 2 is an even prime number.
+(2) If 2 is prime, then 4 is not prime.
+(3) Only 2 is prime, for 6 to be prime.
+(4) Unless 6 is prime, 4 is prime.
+
+Please provide the answers in the format [[];[];[];[]].
+</example 4>
+
+<example 5>
+Let the domain of individuals be D = {0, 1, 2, ..., 10}. 
+Symbolize the following propositions:
+
+(1) All even numbers in D are divisible by 2.
+(2) Some even numbers in D are multiples of 4.
+
+For (1), using predicates:
+G(x): x is even,
+H(x): x is divisible by 2,
+(1) can be symbolized as?
+
+For (2), using predicates:
+G(x): x is even,
+R(x): x is a multiple of 4,
+(2) can be symbolized as?
+
+Please provide the answers in the format [[];[]].
+</example 5>
+
+<example 6>
+Let the domain of individuals be D = {x |x is a person}.
+Symbolize the following propositions:
+
+(1) All Chinese people use chopsticks to eat.
+(2) Some Americans do not live in the United States.
+
+For (1), using predicates:
+F(x): x is Chinese,
+G(x): x uses chopsticks to eat,
+(1) can be symbolized as?
+
+For (2), using predicates:
+F(x): x is American,
+G(x): x lives in the United States,
+(2) can be symbolized as?
+
+Please provide the answers in the format [[];[]].
+</example 6>
+
+<example 7>
+Using the universal domain of individuals, symbolize the following propositions:
+
+(1) Any even number x and y have a common divisor greater than 1.
+(2) There exist odd numbers x and y that do not have a common divisor greater than 1.
+(3) It is true that some trains are faster than all cars.
+
+For (1), using predicates:
+F(x): x is even,
+H(x,y): x and y have a common divisor greater than 1,
+(1) can be symbolized as?
+
+For (2), using predicates:
+G(x): x is odd,
+H(x,y): x and y have a common divisor greater than 1,
+(2) can be symbolized as?
+
+For (3), using predicates:
+F(x): x is a train,
+G(y): y is a car,
+H(x,y): x is faster than y,
+(3) can be symbolized as?
+
+Please provide the answers in the format [[];[];[]].
+</example 7>
+
+<example 8>
+Using the domain of individuals as the set of integers Z, 
+symbolize the following statement:
+\"For any x and y, there exists a z such that x + y = z.\"
+Let H(x, y, z) denote x + y = z. 
+How can this be symbolized?
+
+Please provide the answer in the format [[]].
+</example 8>
+
+<example 9>
+Using the domain of individuals as the set of real numbers R, 
+symbolize the following proposition:
+\"For every ε > 0, there exists λ > 0 such that whenever |x - x0| < λ, it holds that |f(x) - f(x0)| < ε.\"
+
+Let L(x): x > 0,
+M(x, y, z): |x - y| < z,
+N(x, y, z): |f(x) - f(y)| < z.
+
+How can this be symbolized?
+
+Please provide the answer in the format [[]].
+</example 9>
+
+
+请完成上述谜题的训练场环境类实现，包括所有必要的方法。
+"""
+
+from bootcamp import Basebootcamp
+import re
+import random
+from collections import OrderedDict
+from bootcamp import Basebootcamp
+
+class KorLogicPredicateLogicFormalizationbootcamp(Basebootcamp):
+    def __init__(self, num_problems=3, max_quantifiers=3):
+        self.num_problems = num_problems
+        self.max_quantifiers = max_quantifiers
+        self.problem_templates = [
+            self._create_universal_implication,
+            self._create_existential_conjunction,
+            self._create_0ary_predicate,
+            self._create_nested_quantifiers,
+            self._create_negation_case,
+            self._create_multiple_quantifiers
+        ]
+
+    def case_generator(self):
+        problems = []
+        selected_templates = random.choices(self.problem_templates, k=self.num_problems)
+        
+        for template in selected_templates:
+            problems.append(template())
+        
+        return {
+            "problems": problems,
+            "answer_format": f"[[{';'.join(['answer']*self.num_problems)}]]"
+        }
+
+    @staticmethod
+    def prompt_func(question_case):
+        prompt = """In first-order logic, symbolize the following propositions using the given predicates.
+Strictly follow these notation rules:
+- Universal Quantifier: Ax (for all x)
+- Existential Quantifier: Ex (there exists x)
+- Logical Connectives: & (and), | (or), ⇒ (implies), ∼ (not)
+- Predicate format: Use capitalized letters with variables (e.g., F(x), G(x,y))
+- 0-ary predicates must use constants (e.g., F(a), G(b,c))
+
+"""
+        for idx, problem in enumerate(question_case["problems"], 1):
+            prompt += f"\nProblem {idx}: {problem['description']}\n"
+            prompt += "Predicates:\n"
+            for pred, definition in OrderedDict(sorted(problem["predicates"].items())).items():
+                prompt += f"- {pred}: {definition}\n"
+        
+        prompt += "\nProvide answers in [[answer1;answer2;...]] format exactly as required."
+        return prompt
+
+    @staticmethod
+    def extract_output(output):
+        matches = re.findall(r'\[\[(.*?)\]\]', output, flags=re.DOTALL)
+        if not matches:
+            return None
+        last_match = matches[-1].replace('\n', ' ').strip()
+        return [s.strip() for s in last_match.split(';') if s.strip()]
+
+    @classmethod
+    def _verify_correction(cls, solution, identity):
+        try:
+            if not isinstance(solution, list) or len(solution) != len(identity["problems"]):
+                return False
+            return all(
+                cls._normalize(sol) == cls._normalize(prob["correct_answer"])
+                for sol, prob in zip(solution, identity["problems"])
+            )
+        except Exception:
+            return False
+
+    @staticmethod
+    def _normalize(expr):
+        return expr.replace(' ', '').upper()
+
+    # Enhanced problem generators
+    def _create_universal_implication(self):
+        domain_map = {
+            "humans": ["breathe", "are mortal"],
+            "students": ["study hard", "attend classes"],
+            "prime numbers": ["are even", "are greater than 2"],
+            "birds": ["fly", "have feathers"],
+        }
+        subject, conditions = random.choice(list(domain_map.items()))
+        condition = random.choice(conditions)
+        
+        return {
+            "description": f"Using universal domain: All {subject} {condition}.",
+            "predicates": {
+                "F(x)": f"x is a {subject}",
+                "G(x)": f"x {condition}"
+            },
+            "correct_answer": "Ax(F(x)⇒G(x))"
+        }
+
+    def _create_existential_conjunction(self):
+        entities = {
+            "rabbits": ["run fast", "have long ears"],
+            "cars": ["are red", "have turbo engines"],
+            "apples": ["are sweet", "are organic"],
+            "turtles": ["swim slowly", "have hard shells"],
+        }
+        subject, properties = random.choice(list(entities.items()))
+        prop = random.choice(properties)
+        
+        return {
+            "description": f"Using universal domain: Some {subject} {prop}.",
+            "predicates": {
+                "F(x)": f"x is a {subject}",
+                "G(x)": f"x {prop}"
+            },
+            "correct_answer": "Ex(F(x)&G(x))"
+        }
+
+    def _create_0ary_predicate(self):
+        constants = ["a", "b", "c", "d"]
+        templates = [
+            ("{c} is both {p1} and {p2}", "&"),
+            ("If {c1} is {p} then {c2} is {p}", "⇒"),
+            ("Either {c1} is {p} or {c2} is {p}", "|"),
+            ("Neither {c1} nor {c2} is {p}", "∼{0}&∼{1}")
+        ]
+        template, conn = random.choice(templates)
+        
+        if template.count("{c}") == 1:
+            c = random.choice(constants)
+            p1, p2 = random.sample(["F", "G", "H"], 2)
+            return {
+                "description": template.format(c=c, p1=p1, p2=p2),
+                "predicates": {
+                    f"{p1}({c})": f"{c} has property {p1}",
+                    f"{p2}({c})": f"{c} has property {p2}"
+                },
+                "correct_answer": f"{p1}({c}){conn}{p2}({c})"
+            }
+        else:
+            c1, c2 = random.sample(constants, 2)
+            p = random.choice(["F", "G"])
+            if "Neither" in template:
+                answer = conn.format(f"{p}({c1})", f"{p}({c2})")
+            else:
+                answer = f"{p}({c1}){conn}{p}({c2})"
+            return {
+                "description": template.format(c1=c1, c2=c2, p=p),
+                "predicates": {
+                    f"{p}({c1})": f"{c1} has property {p}",
+                    f"{p}({c2})": f"{c2} has property {p}"
+                },
+                "correct_answer": answer
+            }
+
+    def _create_nested_quantifiers(self):
+        relations = {
+            "faster than": ["rabbits", "turtles"],
+            "smarter than": ["humans", "animals"],
+            "older than": ["students", "teachers"],
+        }
+        rel_desc, (subject, obj) = random.choice(list(relations.items()))
+        
+        return {
+            "description": f"Symbolize: Some {subject} are {rel_desc} all {obj}.",
+            "predicates": {
+                "F(x)": f"x is a {subject}",
+                "G(y)": f"y is a {obj}",
+                "H(x,y)": f"x is {rel_desc} y"
+            },
+            "correct_answer": "Ex(F(x)&Ay(G(y)⇒H(x,y)))"
+        }
+
+    # New problem types
+    def _create_negation_case(self):
+        return {
+            "description": "No humans can fly. (Using universal domain)",
+            "predicates": {
+                "F(x)": "x is human",
+                "G(x)": "x can fly"
+            },
+            "correct_answer": "Ax(F(x)⇒∼G(x))"
+        }
+
+    def _create_multiple_quantifiers(self):
+        return {
+            "description": "Every person has someone they love. (Domain: people)",
+            "predicates": {
+                "F(x,y)": "x loves y"
+            },
+            "correct_answer": "AxEyF(x,y)"
+        }