Add llama-3.3-70b-instruct eval configs for the algebra and algorithmic categories

This commit is contained in:
Andreas Koepf 2025-02-25 23:07:46 +01:00
parent 92c8be1699
commit 6d5168d1e5
9 changed files with 62 additions and 0 deletions

View file

@ -1,4 +1,5 @@
model: anthropic/claude-3.7-sonnet # find model id: https://openrouter.ai/models
provider: Anthropic
category: test
datasets:
- YOUR_DATASET_NAME

View file

@ -0,0 +1,14 @@
# Eval config: meta-llama/llama-3.3-70b-instruct on the "algebra" category.
# NOTE(review): the per-key notes below are inferred from the key names only;
# confirm them against the eval runner that consumes this file.

# Model id and the provider that serves it.
model: meta-llama/llama-3.3-70b-instruct
provider: Hyperbolic

# Category label and the datasets evaluated under it.
category: algebra
datasets:
  - intermediate_integration
  - polynomial_equations
  - polynomial_multiplication
  - simple_equations
  - simple_integration
  - complex_arithmetic

# Presumably the output directory for results — TODO confirm.
eval_dir: results/llama-3.3-70b-instruct

# Presumably the number of generated items per dataset and the RNG seed.
# NOTE(review): the algorithmic config for this same model uses seed 45;
# confirm that the differing seed here is intentional.
dataset_size: 50
dataset_seed: 42

# Presumably the chat role used for the developer/system prompt — TODO confirm.
developer_role: system

View file

@ -0,0 +1,41 @@
# Eval config: meta-llama/llama-3.3-70b-instruct on the "algorithmic" category.
# NOTE(review): the per-key notes below are inferred from the key names only;
# confirm them against the eval runner that consumes this file.

# Model id and the provider that serves it.
model: meta-llama/llama-3.3-70b-instruct
provider: Hyperbolic

# Category label and the datasets evaluated under it (alphabetical order).
category: algorithmic
datasets:
  - ab
  - base_conversion
  - binary_alternation
  - binary_matrix
  - caesar_cipher
  - count_primes
  - cryptarithm
  - game_of_life
  - graph_color
  - group_anagrams
  - isomorphic_strings
  - jugs
  - letter_counting
  - letter_jumble
  - manipulate_matrix
  - number_filtering
  - number_sorting
  - palindrome
  - palindrome_partitioning
  - pool_matrix
  - ransom_note
  - rotate_matrix
  - rotten_oranges
  - sentence_reordering
  - spell_backward
  - spiral_matrix
  - string_insertion
  - string_manipulation
  - string_splitting
  - string_synthesis
  - word_ladder
  - word_sequence_reversal
  - word_sorting

# Presumably the output directory for results — TODO confirm.
eval_dir: results/llama-3.3-70b-instruct

# Presumably the number of generated items per dataset and the RNG seed.
dataset_size: 50
dataset_seed: 45

# Presumably the chat role used for the developer/system prompt — TODO confirm.
developer_role: system

View file

@ -1,4 +1,5 @@
model: deepseek/deepseek-r1
provider: Nebius
category: algebra
datasets:
- intermediate_integration

View file

@ -1,4 +1,5 @@
model: deepseek/deepseek-r1
provider: Nebius
category: algorithmic
datasets:
- ab

View file

@ -1,4 +1,5 @@
model: deepseek/deepseek-r1
provider: Nebius
category: cognition
datasets:
- color_cube_rotation

View file

@ -1,4 +1,5 @@
model: deepseek/deepseek-r1
provider: Nebius
category: logic
datasets:
- propositional_logic