mirror of
https://github.com/open-thought/reasoning-gym.git
synced 2026-04-19 12:58:07 +00:00
parent
48f082663a
commit
29179f783e
2 changed files with 8 additions and 1 deletions
|
|
@ -15,6 +15,13 @@ from tenacity import AsyncRetrying, retry_if_exception_type, stop_after_attempt,
|
|||
import reasoning_gym
|
||||
from reasoning_gym.utils import extract_answer
|
||||
|
||||
# Configure logging
|
||||
logging.basicConfig(
|
||||
level=logging.INFO,
|
||||
format="%(asctime)s - %(name)s - %(levelname)s - %(message)s",
|
||||
handlers=[logging.StreamHandler()],
|
||||
)
|
||||
|
||||
|
||||
class OpenRouterEvaluator:
|
||||
def __init__(self, model: str, config: EvalConfig):
|
||||
|
|
|
|||
|
|
@ -25,7 +25,7 @@ datasets:
|
|||
- word_ladder
|
||||
- word_sequence_reversal
|
||||
- word_sorting
|
||||
eval_dir: eval/r1
|
||||
eval_dir: eval/sonnet-3.5
|
||||
dataset_size: 50
|
||||
dataset_seed: 45
|
||||
developer_role: system
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue