Spaces:
Running
on
Zero
Running
on
Zero
File size: 6,871 Bytes
ffbf761 e154ec4 44a5fb8 e154ec4 c78bea2 3533c8c c78bea2 e154ec4 c78bea2 e154ec4 ffbf761 c78bea2 44f6fd9 4106fee 44f6fd9 4106fee ffbf761 674aded c78bea2 ffbf761 c78bea2 674aded c78bea2 674aded c78bea2 e154ec4 c78bea2 ffbf761 674aded ffbf761 674aded c78bea2 ffbf761 4106fee c78bea2 4106fee c78bea2 4106fee 674aded ffbf761 c78bea2 674aded ffbf761 674aded 4106fee ffbf761 674aded ffbf761 674aded ffbf761 674aded 4106fee 674aded 4106fee 674aded ffbf761 674aded 2477854 50e34ab 4b2c00a 9be5775 c3b6f2a c78bea2 4b2c00a 50e34ab c78bea2 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 |
import rerun as rr
import numpy as np
from typing import Dict, Any, List
from utils.geometry import vector3_to_numpy, euler_to_quaternion
def create_subject_box(frame: Dict[str, Any], dimensions: Dict[str, float]) -> Dict[str, np.ndarray]:
"""
Given a single frame (position, rotation) and subject's dimensions,
return the center and half_size for a box representation.
"""
position = vector3_to_numpy(frame['position'])
half_size = np.array([
dimensions['width'] / 2.0,
dimensions['height'] / 2.0,
dimensions['depth'] / 2.0
], dtype=np.float32)
return {
'center': position,
'half_size': half_size
}
class SimulationLogger:
def __init__(self):
rr.init("camera_simulation")
rr.log("world", rr.ViewCoordinates.RIGHT_HAND_Y_UP, timeless=True)
self.K = np.array([
[500, 0, 960],
[0, 500, 540],
[0, 0, 1]
])
def log_metadata(self, instructions: List[Dict[str, Any]]) -> None:
if not instructions:
return
rr.log(
"metadata/instructions",
rr.TextDocument(
"\n".join([
f"Instruction {i+1}:\n"
f" Movement: {inst.get('cameraMovement', 'N/A')}\n"
f" Easing: {inst.get('movementEasing', 'N/A')}\n"
f" Frames: {inst.get('frameCount', 'N/A')}\n"
f" Camera Angle: {inst.get('initialCameraAngle', 'N/A')}\n"
f" Shot Type: {inst.get('initialShotType', 'N/A')}\n"
f" Subject Index: {inst.get('subjectIndex', 'N/A')}"
for i, inst in enumerate(instructions)
])
),
timeless=True
)
def log_subjects(self, subjects: List[Dict[str, Any]]) -> None:
"""
Updated to handle dynamic subjects:
- Each subject has multiple frames (position, rotation).
- Subject dimensions (width, height, depth) remain constant across frames.
"""
if not subjects:
return
# For each subject, log each frame at a different time index.
for subject_idx, subject in enumerate(subjects):
dimensions = subject.get("dimensions", {})
frames = subject.get("frames", [])
label = subject.get('objectClass', f"Subject_{subject_idx}")
for frame_idx, frame in enumerate(frames):
rr.set_time_sequence("frame_idx", frame_idx)
try:
box_params = create_subject_box(frame, dimensions)
center = box_params['center']
half_size = box_params['half_size']
# Convert Euler angles to quaternion for rotation
rotation_q = euler_to_quaternion(frame['rotation'])
# 1) Log a transform for the subject so the box is placed at 'center' with correct rotation
rr.log(
f"world/subjects/subject_{subject_idx}",
rr.Transform3D(
translation=center,
rotation=rr.Quaternion(xyzw=rotation_q)
)
)
# 2) Log a box at the origin of the subject's local transform
rr.log(
f"world/subjects/subject_{subject_idx}/box",
rr.Boxes3D(
centers=np.array([[0.0, 0.0, 0.0]], dtype=np.float32),
half_sizes=np.array([half_size], dtype=np.float32),
colors=np.array([[0.8, 0.2, 0.2, 1.0]], dtype=np.float32),
labels=[label],
show_labels=False,
fill_mode="solid"
)
)
except Exception as e:
print(f"Error creating box parameters for subject {subject_idx}, frame {frame_idx}: {str(e)}")
def log_camera_trajectory(self, camera_frames: List[Dict[str, Any]]) -> None:
if not camera_frames:
return
try:
camera_positions = np.array([
vector3_to_numpy(frame['position']) for frame in camera_frames
])
rr.log(
"world/camera_trajectory",
rr.Points3D(
camera_positions,
colors=np.full((len(camera_positions), 4), [0.0, 0.8, 0.8, 1.0])
),
timeless=True
)
if len(camera_positions) > 1:
lines = np.stack([camera_positions[:-1], camera_positions[1:]], axis=1)
rr.log(
"world/camera_trajectory/line",
rr.LineStrips3D(
lines,
colors=[(0.0, 0.8, 0.8, 1.0)]
),
timeless=True
)
except Exception as e:
print(f"Error logging camera trajectory: {str(e)}")
def log_camera_frames(self, camera_frames: List[Dict[str, Any]]) -> None:
if not camera_frames:
return
for frame_idx, camera_frame in enumerate(camera_frames):
try:
rr.set_time_sequence("frame_idx", frame_idx)
position = vector3_to_numpy(camera_frame['position'])
rotation_q = euler_to_quaternion(camera_frame['angle'])
rr.log(
"world/camera",
rr.Transform3D(
translation=position,
rotation=rr.Quaternion(xyzw=rotation_q)
)
)
rr.log(
"world/camera/image",
rr.Pinhole(
image_from_camera=self.K,
width=1920,
height=1080
)
)
except Exception as e:
print(f"Error logging camera frame {frame_idx}: {str(e)}")
def log_helper_keyframes(self, helper_keyframes: List[Dict[str, Any]]) -> None:
if not helper_keyframes:
return
helper_positions = np.array([
vector3_to_numpy(frame['position']) for frame in helper_keyframes
])
rr.log(
"world/helper_keyframes",
rr.Points3D(
helper_positions,
radii=np.full(len(helper_positions), 0.03),
colors=np.full((len(helper_positions), 4), [1.0, 1.0, 0.0, 1.0]),
),
timeless=True
)
for keyframe_idx, helper_keyframe in enumerate(helper_keyframes):
try:
|