mirror of
https://github.com/open-thought/reasoning-gym.git
synced 2026-04-19 12:58:07 +00:00
210 lines
5.6 KiB
Python
210 lines
5.6 KiB
Python
"""Tests for Manipulate Matrix questions generation"""
|
|
|
|
import pytest
|
|
|
|
from reasoning_gym.algorithmic.manipulate_matrix import ManipulateMatrixConfig, ManipulateMatrixDataset
|
|
|
|
|
|
def test_manipulate_matrix_config_validation():
|
|
"""Test that invalid configs raise appropriate errors"""
|
|
|
|
invalid_dims = [-1, 0] # Dimensions should be positive integers
|
|
dim_fields = ["max_rows", "max_cols"]
|
|
|
|
for field in dim_fields:
|
|
for dim in invalid_dims:
|
|
with pytest.raises(AssertionError):
|
|
config = ManipulateMatrixConfig(**{field: dim})
|
|
config.validate()
|
|
|
|
invalid_probabilities = [-0.01, 1.01] # Probabilities should be between 0 and 1 inclusive
|
|
probability_fields = [
|
|
"p_hmirror",
|
|
"p_vmirror",
|
|
"p_dmirror",
|
|
"p_cmirror",
|
|
"p_map",
|
|
"p_crop",
|
|
"p_remove_every_nth_row",
|
|
"p_remove_every_nth_col",
|
|
"p_zero_divisible",
|
|
]
|
|
|
|
for field in probability_fields:
|
|
for prob in invalid_probabilities:
|
|
with pytest.raises(AssertionError):
|
|
config = ManipulateMatrixConfig(**{field: prob})
|
|
config.validate()
|
|
|
|
|
|
def test_manipulate_matrix_dataset_deterministic():
|
|
"""Test that dataset generates same items with same seed"""
|
|
config = ManipulateMatrixConfig(seed=42, size=10)
|
|
dataset1 = ManipulateMatrixDataset(config)
|
|
dataset2 = ManipulateMatrixDataset(config)
|
|
|
|
for i in range(len(dataset1)):
|
|
assert dataset1[i] == dataset2[i]
|
|
|
|
|
|
def test_manipulate_matrix_dataset_items():
|
|
"""Test basic properties of generated items"""
|
|
config = ManipulateMatrixConfig(max_rows=7, max_cols=7, size=10, seed=42)
|
|
dataset = ManipulateMatrixDataset(config)
|
|
|
|
for i in range(len(dataset)):
|
|
item = dataset[i]
|
|
# Check item structure
|
|
assert isinstance(item, dict)
|
|
assert "question" in item
|
|
assert "answer" in item
|
|
assert "metadata" in item
|
|
|
|
# Check metadata
|
|
assert "matrix" in item["metadata"]
|
|
assert "solution" in item["metadata"]
|
|
assert "operations" in item["metadata"]
|
|
|
|
matrix = item["metadata"]["matrix"]
|
|
solution = item["metadata"]["solution"]
|
|
operations = item["metadata"]["operations"]
|
|
|
|
# Verify matrix dimensions
|
|
assert len(matrix) <= config.max_rows
|
|
assert all(len(row) <= config.max_cols for row in matrix)
|
|
assert len(solution) <= config.max_rows
|
|
assert all(len(row) <= config.max_cols for row in solution)
|
|
for op in operations:
|
|
assert "transform" in op
|
|
assert "instruction" in op
|
|
|
|
|
|
def test_manipulate_matrix_dataset_iteration():
|
|
"""Test that iteration respects dataset size"""
|
|
config = ManipulateMatrixConfig(size=5, seed=42)
|
|
dataset = ManipulateMatrixDataset(config)
|
|
|
|
items = list(dataset)
|
|
assert len(items) == config.size
|
|
|
|
assert items == list(dataset)
|
|
|
|
|
|
def test_manipulate_matrix_transforms():
|
|
"""Test the _get_rotated method"""
|
|
config = ManipulateMatrixConfig(seed=42)
|
|
dataset = ManipulateMatrixDataset(config)
|
|
matrix = [
|
|
[1, 2, 3, 4, 5],
|
|
[6, 7, 8, 9, 10],
|
|
[11, 12, 13, 14, 15],
|
|
[16, 17, 18, 19, 20],
|
|
[21, 22, 23, 24, 25],
|
|
]
|
|
|
|
# identity
|
|
assert dataset._identity(matrix) == matrix
|
|
|
|
# rot 90 degrees
|
|
assert dataset._rot90(matrix) == [
|
|
[21, 16, 11, 6, 1],
|
|
[22, 17, 12, 7, 2],
|
|
[23, 18, 13, 8, 3],
|
|
[24, 19, 14, 9, 4],
|
|
[25, 20, 15, 10, 5],
|
|
]
|
|
|
|
# rot 180 degrees
|
|
assert dataset._rot180(matrix) == [
|
|
[25, 24, 23, 22, 21],
|
|
[20, 19, 18, 17, 16],
|
|
[15, 14, 13, 12, 11],
|
|
[10, 9, 8, 7, 6],
|
|
[5, 4, 3, 2, 1],
|
|
]
|
|
|
|
# rot 270 degrees
|
|
assert dataset._rot270(matrix) == [
|
|
[5, 10, 15, 20, 25],
|
|
[4, 9, 14, 19, 24],
|
|
[3, 8, 13, 18, 23],
|
|
[2, 7, 12, 17, 22],
|
|
[1, 6, 11, 16, 21],
|
|
]
|
|
|
|
# hmirror
|
|
assert dataset._hmirror(matrix) == [
|
|
[21, 22, 23, 24, 25],
|
|
[16, 17, 18, 19, 20],
|
|
[11, 12, 13, 14, 15],
|
|
[6, 7, 8, 9, 10],
|
|
[1, 2, 3, 4, 5],
|
|
]
|
|
|
|
# vmirror
|
|
assert dataset._vmirror(matrix) == [
|
|
[5, 4, 3, 2, 1],
|
|
[10, 9, 8, 7, 6],
|
|
[15, 14, 13, 12, 11],
|
|
[20, 19, 18, 17, 16],
|
|
[25, 24, 23, 22, 21],
|
|
]
|
|
|
|
# dmirror
|
|
assert dataset._dmirror(matrix) == [
|
|
[1, 6, 11, 16, 21],
|
|
[2, 7, 12, 17, 22],
|
|
[3, 8, 13, 18, 23],
|
|
[4, 9, 14, 19, 24],
|
|
[5, 10, 15, 20, 25],
|
|
]
|
|
|
|
# cmirror
|
|
assert dataset._cmirror(matrix) == [
|
|
[25, 20, 15, 10, 5],
|
|
[24, 19, 14, 9, 4],
|
|
[23, 18, 13, 8, 3],
|
|
[22, 17, 12, 7, 2],
|
|
[21, 16, 11, 6, 1],
|
|
]
|
|
|
|
# map
|
|
assert dataset._map(matrix, a=13, b=0) == [
|
|
[1, 2, 3, 4, 5],
|
|
[6, 7, 8, 9, 10],
|
|
[11, 12, 0, 14, 15], # 13 -> 0
|
|
[16, 17, 18, 19, 20],
|
|
[21, 22, 23, 24, 25],
|
|
]
|
|
|
|
# zero divisible
|
|
assert dataset._zero_divisible(matrix, k=3) == [
|
|
[1, 2, 0, 4, 5],
|
|
[0, 7, 8, 0, 10],
|
|
[11, 0, 13, 14, 0],
|
|
[16, 17, 0, 19, 20],
|
|
[0, 22, 23, 0, 25],
|
|
]
|
|
|
|
# crop
|
|
assert dataset._crop(matrix, row_start=2, row_end=4, col_start=1, col_end=3) == [
|
|
[6, 7, 8],
|
|
[11, 12, 13],
|
|
[16, 17, 18],
|
|
]
|
|
|
|
# remove every nth row
|
|
assert dataset._remove_every_nth_row(matrix, n=2) == [
|
|
[1, 2, 3, 4, 5],
|
|
[11, 12, 13, 14, 15],
|
|
[21, 22, 23, 24, 25],
|
|
]
|
|
|
|
# remove every nth col
|
|
assert dataset._remove_every_nth_col(matrix, n=2) == [
|
|
[1, 3, 5],
|
|
[6, 8, 10],
|
|
[11, 13, 15],
|
|
[16, 18, 20],
|
|
[21, 23, 25],
|
|
]
|