from omni.isaac.kit import SimulationApp

# Start simulation app
simulation_app = SimulationApp({"headless": False, "renderer": "RayTracedLighting"})

import omni.replicator.core as rep
from pxr import UsdLux, Gf, UsdGeom, Usd, Sdf
import omni.usd
import numpy as np
import cv2
from ultralytics import YOLO
import matplotlib
matplotlib.use('Agg')
import matplotlib.pyplot as plt
import torch
import time

# Select the CUDA device if available, otherwise fall back to CPU
def assign_cuda_device():
    if torch.cuda.is_available():
        device = torch.device("cuda:0")
        torch.cuda.set_device(device)
        print(f"Using CUDA device: {torch.cuda.current_device()} ({torch.cuda.get_device_name(0)})")
        return device
    else:
        print("CUDA is not available. Falling back to CPU.")
        return torch.device("cpu")

device = assign_cuda_device()

# Load stage
rep.new_layer()
stage_path = "D:/isaaclab/_isaac_sim/Humanoid_sim/scena1.usd"
omni.usd.get_context().open_stage(stage_path)

# Robot path
robot_path = "/World/g1"
camera_path = "/World/g1/pelvis/robot_eye_camera"  # Camera prim parented under the robot's pelvis

# Wait for stage to load
stage = omni.usd.get_context().get_stage()
while stage is None:
    simulation_app.update()
    stage = omni.usd.get_context().get_stage()
    time.sleep(0.1)

# Verify robot and camera exist
robot_prim = stage.GetPrimAtPath(robot_path)
if not robot_prim.IsValid():
    raise RuntimeError(f"Robot not found at path: {robot_path}")
print(f"Found robot at: {robot_path}")

camera_prim = stage.GetPrimAtPath(camera_path)
if not camera_prim.IsValid():
    raise RuntimeError(f"Camera not found at path: {camera_path}")
print(f"Using new robot eye camera at: {camera_path}")

# Run a few warm-up updates so materials and assets finish loading;
# without this the first rendered frames are often black
for _ in range(20):
    simulation_app.update()

# Create render product
print("Setting up render product with camera in the stage...")
height, width = 1024, 1024
render_product = rep.create.render_product(camera_path, resolution=(width, height))
if render_product is None:
    raise RuntimeError("Failed to create render product")
print(f"Successfully created render product for camera at {camera_path}")

# Annotator setup
annotator = rep.AnnotatorRegistry.get_annotator("rgb")
annotator.attach([render_product])
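# Note: "distance_to_camera" reports the Euclidean distance from the camera to
# each surface point along its ray, not the perpendicular Z-depth; Replicator's
# "distance_to_image_plane" annotator provides the latter if you need it.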
depth_annotator = rep.AnnotatorRegistry.get_annotator("distance_to_camera")
depth_annotator.attach([render_product])

# Drive Replicator manually: orchestrator.step() is called once per frame in the
# capture loop below, so a continuous orchestrator.run() is not needed here.

# Capture an RGB frame and its matching depth map
captured_image = None
captured_depth = None

for i in range(10):
    simulation_app.update()
    rep.orchestrator.step()
    time.sleep(0.05)

    rgb_data = annotator.get_data()
    depth_data = depth_annotator.get_data()

    if rgb_data is not None and depth_data is not None and rgb_data.size > 0 and depth_data.size > 0:
        # Annotator outputs arrive as numpy arrays: RGBA uint8 for "rgb",
        # float32 metres for "distance_to_camera"; drop the alpha channel
        rgb_image = np.asarray(rgb_data, dtype=np.uint8).reshape((height, width, 4))[:, :, :3]
        depth_image = np.asarray(depth_data, dtype=np.float32).reshape((height, width))

        mean_brightness = np.mean(rgb_image)
        if mean_brightness > 10.0:
            captured_image = rgb_image
            captured_depth = depth_image
            print(f"Captured image and depth at frame {i}")
            cv2.imwrite("capture_rgb.png", cv2.cvtColor(rgb_image, cv2.COLOR_RGB2BGR))
            np.save("capture_depth.npy", depth_image)
            break
    else:
        print(f"Frame {i}: No valid data received")

# Abort if no valid frame was captured
if captured_image is None or captured_depth is None:
    raise RuntimeError("Failed to capture a valid image after multiple attempts")

# Process captured image
image_rgb = captured_image.copy()
image_bgr = cv2.cvtColor(image_rgb, cv2.COLOR_RGB2BGR)
cv2.imwrite("humanoid_captured_image_fixed.png", image_bgr)
print("Saved captured image as 'humanoid_captured_image_fixed.png'")
depth_map = captured_depth
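
# Quick visual sanity check of the depth map (a sketch; the 0.1-20 m clipping
# range is an assumption for an indoor-scale scene, adjust to your stage):
finite_depth = np.nan_to_num(depth_map, nan=0.0, posinf=0.0, neginf=0.0)
clipped = np.clip(finite_depth, 0.1, 20.0)
depth_u8 = ((clipped - 0.1) / (20.0 - 0.1) * 255.0).astype(np.uint8)
cv2.imwrite("capture_depth_vis.png", cv2.applyColorMap(depth_u8, cv2.COLORMAP_JET))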

# YOLO inference
print("Loading YOLO model...")
# model = YOLO('yolov8l-oiv7.pt').to(device)
model = YOLO('yolov8x.pt').to(device)
print("Running YOLO inference...")
# Pass the BGR numpy image directly: Ultralytics handles resizing, normalization,
# and channel order itself, whereas a hand-built tensor is assumed to already be
# RGB and would be fed here with swapped channels.
results = model(image_bgr)
for box in results[0].boxes.data:
    x1, y1, x2, y2 = map(int, box[:4])
    # Clamp the box centre to valid pixel coordinates before indexing the depth map
    cx = min(max((x1 + x2) // 2, 0), width - 1)
    cy = min(max((y1 + y2) // 2, 0), height - 1)
    distance = depth_map[cy, cx]

    # boxes.data rows are [x1, y1, x2, y2, confidence, class]
    class_id = int(box[5]) if len(box) > 5 else -1
    class_name = model.names.get(class_id, "Unknown")
    text = f"{class_name}: {distance:.2f}m"

    print(f"Object at ({cx}, {cy}) has estimated distance: {distance:.2f} meters")

    # Draw the box and label on the image (coordinates are already ints)
    cv2.rectangle(image_bgr, (x1, y1), (x2, y2), (0, 255, 0), 2)
    cv2.putText(image_bgr, text, (x1, y1 - 10),
                cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 255, 255), 2)
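
# Single-pixel depth lookups are brittle: the centre pixel can land on sky
# (inf) or on a depth discontinuity. A more robust estimate, sketched below
# under the assumption that a small window around the centre is representative,
# takes the median of the finite depths in that window (the 5 px half-width is
# an arbitrary choice):
def robust_distance(depth, cx, cy, half=5):
    h, w = depth.shape
    patch = depth[max(0, cy - half):min(h, cy + half + 1),
                  max(0, cx - half):min(w, cx + half + 1)]
    finite = patch[np.isfinite(patch)]
    return float(np.median(finite)) if finite.size else float("nan")
# Usage inside the loop above: distance = robust_distance(depth_map, cx, cy)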

# Print detection results
print("\n=== YOLO Detection Results ===")
print("YOLO classes:", model.names)
if len(results[0].boxes) > 0:
    detected_classes = [results[0].names[int(cls)] for cls in results[0].boxes.cls]
    print("Detected classes:", detected_classes)
    print("Detected boxes:", results[0].boxes.data)
    print("Confidence scores:", results[0].boxes.conf)
else:
    print("No objects detected")

# Draw results
annotated_frame = results[0].plot()
annotated_rgb = cv2.cvtColor(annotated_frame, cv2.COLOR_BGR2RGB)
plt.figure(figsize=(15, 10))
plt.imshow(annotated_rgb)
plt.axis('off')
plt.title("YOLOv8 Detection from Stage Camera in Isaac Sim")
plt.savefig("humanoid_yolo_output_fixed.png", dpi=150, bbox_inches='tight')
plt.close()
print("Saved YOLO detection result as 'humanoid_yolo_output_fixed.png'")
cv2.imwrite("humanoid_yolo_depth_overlay.png", image_bgr)
print("Saved image with YOLO detections and depth overlay")

# Save detection summary
detection_summary = f"""
Detection Summary:
- Total detections: {len(results[0].boxes)}
- Classes found: {[results[0].names[int(cls)] for cls in results[0].boxes.cls] if len(results[0].boxes) > 0 else 'None'}
- Image resolution: {width}x{height}
- Camera path: {camera_path}
- Robot path: {robot_path}
- Camera is fixed: True
"""
with open("detection_summary_fixed.txt", "w") as f:
    f.write(detection_summary)
print(detection_summary)

# Cleanup: detach both annotators before closing the stage
print("Cleaning up...")
annotator.detach()
depth_annotator.detach()
omni.usd.get_context().close_stage()
simulation_app.close()
print("Simulation closed successfully")