add pyrender_utils with test

2026-04-19 12:57:58 +00:00 · 2025-05-18 22:41:27 +00:00 · 2025-05-18 22:41:27 +00:00 · c10ebe4b85
commit c10ebe4b85
parent 96fd81daab
3 changed files with 271 additions and 0 deletions
--- a/environments/hack0/pyrender_utils.py
+++ b/environments/hack0/pyrender_utils.py
@ -0,0 +1,225 @@
+import os
+import numpy as np
+import trimesh
+import pyrender
+
+# Headless rendering with GPU acceleration (egl), for non-GPU environments omesa will be faster
+os.environ['PYOPENGL_PLATFORM'] = 'egl'
+
+def create_look_at_matrix(eye: np.ndarray, target: np.ndarray, up: np.ndarray) -> np.ndarray:
+    """
+    Create a look-at transformation matrix for a camera.
+    
+    eye - position of the camera
+    target - position the camera is looking at
+    up - up direction for the camera
+    
+    returns the 4x4 transformation matrix
+    """
+    eye = np.asarray(eye)
+    target = np.asarray(target)
+    up = np.asarray(up)
+    
+    # Forward vector (from eye to target)
+    forward = target - eye
+    forward = forward / np.linalg.norm(forward)
+    
+    # Side vector (right vector)
+    side = np.cross(forward, up)
+    side = side / np.linalg.norm(side)
+    
+    # Recompute up vector to ensure orthogonality
+    up = np.cross(side, forward)
+    up = up / np.linalg.norm(up)
+    
+    # Create the rotation matrix | NOTE: PyRender uses OpenGL convention
+    # where camera looks down negative z-axis
+    R = np.eye(4)
+    R[0, :3] = side
+    R[1, :3] = up
+    R[2, :3] = -forward
+    
+    T = np.eye(4) # translation matrix
+    T[:3, 3] = eye
+    
+    # The camera pose matrix is the inverse of the view matrix
+    # but we need to return the pose directly for pyrender
+    return T @ R
+
+class PyRenderOffline:
+    def __init__(self, width=224, height=224): # Standard CLIP image size
+        self.width = width
+        self.height = height
+        try:
+            self.renderer = pyrender.OffscreenRenderer(viewport_width=self.width, viewport_height=self.height, point_size=1.0)
+        except Exception as e:
+            print(f"Failed to initialize OffscreenRenderer (is a display server/EGL/OSMesa available?): {e}")
+            print("Try: pip install pyglet; or for headless: export PYOPENGL_PLATFORM=osmesa (or egl)")
+            self.renderer = None # Fallback or raise error
+            raise
+
+        # Create camera poses using explicit transformation matrices
+        
+        # Front view (looking along the -Z axis)
+        front_pose = np.array([
+            [1, 0, 0, 0],
+            [0, 1, 0, 0],
+            [0, 0, 1, 5],
+            [0, 0, 0, 1]
+        ])
+        
+        # Top view (looking along the -Y axis)
+        top_pose = np.array([
+            [1, 0, 0, 0],
+            [0, 0, 1, 5],
+            [0, -1, 0, 0],
+            [0, 0, 0, 1]
+        ])
+        
+        # Diagonal view (from upper corner)
+        side_pose = np.array([
+            [0.866, -0.25, 0.433, 3],  # Camera right vector
+            [0.0, 0.866, 0.5, 3],      # Camera up vector  
+            [-0.5, -0.433, 0.75, 5],   # Camera forward vector (pointing at origin)
+            [0, 0, 0, 1]
+        ])
+        
+        # Store camera poses
+        self.camera_poses = [front_pose, top_pose, side_pose]
+        
+        # Debug print for the camera poses cause it doesn't look right
+        # and I'm not a game developer lol
+        print("Camera poses:")
+        for i, pose in enumerate(self.camera_poses):
+            print(f"Camera {i}:\n{pose}")
+        
+        # slightly wider field of view to ensure objects are visible
+        self.camera = pyrender.PerspectiveCamera(yfov=np.pi / 2.5, aspectRatio=1.0)
+        
+        # Bright point light
+        self.light = pyrender.PointLight(color=[1.0, 1.0, 1.0], intensity=10.0)
+
+    def render_mesh_to_images(self, mesh_obj: trimesh.Trimesh):
+        if not self.renderer:
+            print("Renderer not initialized, cannot render.")
+            return [np.zeros((self.height, self.width, 3), dtype=np.uint8) for _ in range(3)]
+
+        print(f"Rendering mesh with {len(mesh_obj.vertices)} vertices and {len(mesh_obj.faces)} faces")
+        
+        images = []
+        
+        # Make a copy to avoid modifying original mesh
+        render_mesh = mesh_obj.copy()
+        
+        # Center and scale the mesh for visibility
+        render_mesh.apply_translation(-render_mesh.centroid)
+        scale_factor = 0.8 / np.max(render_mesh.extents)  # Scale to unit size but slightly smaller
+        render_mesh.apply_scale(scale_factor)
+        
+        # Create a ground plane
+        ground_plane = trimesh.creation.box([4.0, 4.0, 0.01])
+        ground_plane.apply_translation([0, 0, -0.5])
+        
+        # Color scheme for wireframe blueprint
+        blueprint_bg = [0.98, 0.98, 1.0, 1.0]        # Light blue background
+        wireframe_color = [0.0, 0.4, 0.8, 1.0]       # Medium bright blue for wireframes
+        grid_color = [0.0, 0.2, 0.4, 1.0]            # Darker blue for grid
+        
+        # Wireframe material for the edges - completely opaque
+        wireframe_material = pyrender.MetallicRoughnessMaterial(
+            baseColorFactor=wireframe_color,
+            metallicFactor=0.0,
+            roughnessFactor=1.0,
+            wireframe=True
+        )
+        
+        # Grid material for the ground plane
+        grid_material = pyrender.MetallicRoughnessMaterial(
+            baseColorFactor=grid_color,
+            metallicFactor=0.0,
+            roughnessFactor=1.0,
+            wireframe=True
+        )
+        
+        for i, pose in enumerate(self.camera_poses):
+            # Create a fresh scene with blueprint background
+            scene = pyrender.Scene(ambient_light=[0.8, 0.8, 0.95], bg_color=blueprint_bg)
+            
+            # Add ground plane as grid
+            plane_mesh = pyrender.Mesh.from_trimesh(ground_plane, material=grid_material)
+            scene.add(plane_mesh)
+            
+            # For wireframe rendering, we'll create line segments directly
+            edges = render_mesh.edges_unique
+            edge_vertices = []
+            edge_indices = []
+            
+            # Extract all edges for wireframe rendering
+            for _, edge in enumerate(edges):
+                v0_idx = len(edge_vertices)
+                edge_vertices.append(render_mesh.vertices[edge[0]])
+                edge_vertices.append(render_mesh.vertices[edge[1]])
+                edge_indices.append([v0_idx, v0_idx+1])
+            
+            # Create lines primitive for edges
+            if len(edge_vertices) > 0:
+                edge_verts = np.array(edge_vertices, dtype=np.float32)
+                edge_indices = np.array(edge_indices, dtype=np.uint32)
+                
+                # Create a primitive for the lines
+                primitive = pyrender.Primitive(
+                    positions=edge_verts,
+                    indices=edge_indices,
+                    mode=pyrender.constants.GLTF.LINES,
+                    material=wireframe_material
+                )
+                
+                # Create a mesh with just the line primitive
+                edge_mesh = pyrender.Mesh(primitives=[primitive])
+                scene.add(edge_mesh)
+            
+            # Add camera
+            scene.add(self.camera, pose=pose)
+            
+            # Add light from camera direction (key light)
+            scene.add(self.light, pose=pose)
+            
+            # Add second light from above for better visibility
+            top_light_pose = np.eye(4)
+            top_light_pose[1, 3] = 3.0
+            scene.add(self.light, pose=top_light_pose)
+            
+            try:
+                color, _ = self.renderer.render(scene)
+                
+                # Post-process to enhance blueprint effect
+                # Convert to float for processing
+                img_float = color.astype(np.float32) / 255.0
+                
+                # Add a subtle grid pattern to the background
+                grid_size = 40
+                grid_intensity = 0.02
+                
+                # Draw faint horizontal grid lines
+                for y in range(0, color.shape[0], grid_size):
+                    img_float[y:y+1, :, :] = np.minimum(img_float[y:y+1, :, :] + grid_intensity, 1.0)
+                
+                # Draw faint vertical grid lines
+                for x in range(0, color.shape[1], grid_size):
+                    img_float[:, x:x+1, :] = np.minimum(img_float[:, x:x+1, :] + grid_intensity, 1.0)
+                
+                # Convert back to uint8
+                processed_img = (img_float * 255).astype(np.uint8)
+                
+                images.append(processed_img)
+                print(f"Rendered wireframe view {i}")
+                
+            except Exception as e:
+                print(f"Error during rendering view {i}: {e}")
+                images.append(np.zeros((self.height, self.width, 3), dtype=np.uint8))
+        
+        return images
+
+    def __del__(self):
+        if self.renderer:
+            self.renderer.delete()