openvinotoolkit · maxxgx · May 15, 2026 · May 15, 2026 · May 17, 2026 · May 17, 2026
@@ -25,6 +25,12 @@ Physical AI Runtime provides the deployment-side components for running trained
 - **Inference Engine** — Load exported policies from Studio with auto-detected backends
 - **Policy Runtime** — Control loop with observation building and action dispatch
 
+---
+
+<p align="center">
+  <img src="docs/assets/inference_rerun.gif" alt="Inference demo" width="100%">
+</p>
+
 ## Installation
 
 ```bash

@@ -2,102 +2,171 @@
 # Copyright (C) 2026 Intel Corporation
 # SPDX-License-Identifier: Apache-2.0
 
-"""Async inference with PolicyRuntime.
-
-python examples/runtime/async_inference.py \
-  --model ./exports/pi05_cans_openvino \
-  --device GPU.0 \
-  --port /dev/ttyACM0 \
-  --calibration /home/max/.cache/physicalai/robots/a8d8d997-a59e-4423-9006-5d991d223887/calibrations/0b2f185a-8ab2-4956-91c2-3a2ac2dbd8c1.json \
-  --overhead-camera /dev/v4l/by-id/usb-UGREEN_Camera_2K_UGREEN_Camera_2K_SN0001-video-index0 \
-  --arm-camera 353322271391 \
-  --front-camera /dev/v4l/by-id/usb-Innomaker_Innomaker-U20CAM-1080p-S1_SN0001-video-index0 \
-  --width 640 \
-  --height 480 \
-  --fps 30 \
-  --duration-s 60
+"""Run a trained policy on hardware with real-time Rerun visualization.
+
+Prerequisites::
+
+    uv sync --extra capture --extra robots --extra observer-rerun
+
+Examples:
+
+    # SO101 with 3 cameras, Rerun viewer auto-launched
+    python examples/runtime/async_inference.py \\
+      --robot so101 --port /dev/ttyACM0 --calibration ./cal.json \\
+      --model ./exports/my_model \\
+      --camera overhead:uvc:/dev/video0 \\
+      --camera arm:realsense:353322271391 \\
+      --camera front:uvc:/dev/video2 \\
+      --rerun spawn
+
+    # Trossen WidowXAI
+    python examples/runtime/async_inference.py \\
+      --robot widowxai --ip 192.168.1.2 \\
+      --model ./exports/my_model \\
+      --camera front:uvc:/dev/video0
+
+    # Bimanual Trossen WidowXAI
+    python examples/runtime/async_inference.py \\
+      --robot bimanual_widowxai --ip-left 192.168.1.2 --ip-right 192.168.1.3 \\
+      --model ./exports/my_model
+
+    # No --camera args → interactive selection
+    python examples/runtime/async_inference.py \\
+      --robot so101 --port /dev/ttyACM0 --calibration ./cal.json \\
+      --model ./exports/my_model --rerun spawn
 """
 
 from __future__ import annotations
 
 import argparse
+import os
+import signal
 
-import openvino as ov
-import numpy as np
-
-from physicalai.capture import discover_all
-from physicalai.capture.transport import SharedCamera
+from physicalai.capture import select_cameras_interactive
 from physicalai.inference import InferenceModel
-from physicalai.robot import SO101
 from physicalai.runtime import (
     ActionQueue,
     AsyncExecution,
     LerpSmoother,
     PolicyRuntime,
+    RerunCallback,
 )
 
+from utils import build_robot, parse_camera_specs
+
+
+def main() -> None:
+    # Force-exit on second Ctrl+C (Rerun's blocked channels prevent clean shutdown)
+    def _handle_sigint(sig: int, frame: object) -> None:
+        # Restore default handler so next Ctrl+C kills immediately via OS signal
+        signal.signal(signal.SIGINT, signal.SIG_DFL)
+        print("\nInterrupting... press Ctrl+C again to force kill.")
+        raise KeyboardInterrupt
+
+    signal.signal(signal.SIGINT, _handle_sigint)
+
+    parser = argparse.ArgumentParser(
+        description="Run a trained policy on hardware",
+        formatter_class=argparse.RawDescriptionHelpFormatter,
+    )
+
+    # Robot
+    robot_group = parser.add_argument_group("robot")
+    robot_group.add_argument("--robot", required=True, choices=("so101", "widowxai", "bimanual_widowxai"))
+    robot_group.add_argument("--port", help="Serial port (so101)")
+    robot_group.add_argument("--calibration", help="Calibration JSON path (so101)")
+    robot_group.add_argument("--ip", help="Robot IP (widowxai)")
+    robot_group.add_argument("--ip-left", help="Left arm IP (bimanual_widowxai)")
+    robot_group.add_argument("--ip-right", help="Right arm IP (bimanual_widowxai)")
+
+    # Model
+    model_group = parser.add_argument_group("model")
+    model_group.add_argument("--model", required=True, help="Exported model directory")
+    model_group.add_argument("--device", default="GPU", help="OpenVINO device (default: GPU)")
+
+    # Cameras
+    cam_group = parser.add_argument_group("cameras")
+    cam_group.add_argument(
+        "--camera", action="append", dest="cameras", metavar="NAME:DRIVER:DEVICE",
+        help="Camera as name:driver:device_id (repeatable). Omit for interactive selection.",
+    )
+    cam_group.add_argument("--cam-width", type=int, default=640, help="Camera width (default: 640)")
+    cam_group.add_argument("--cam-height", type=int, default=480, help="Camera height (default: 480)")
+    cam_group.add_argument("--cam-fps", type=int, default=30, help="Camera FPS (default: 30)")
+
+    # Runtime
+    rt_group = parser.add_argument_group("runtime")
+    rt_group.add_argument("--fps", type=float, default=30.0, help="Control loop FPS (default: 30)")
+    rt_group.add_argument("--duration-s", type=float, default=60.0, help="Duration in seconds")
+    rt_group.add_argument("--task", type=str, default=None, help="Task string for the model (e.g. 'pick up the can')")
+    rt_group.add_argument("--shared-camera", action="store_true", help="Use shared memory cameras (iceoryx2) — faster but incompatible with debugger")
+    rt_group.add_argument("--request-threshold", type=float, default=0.75, help="Request new inference when queue drops below this fraction of chunk_size (default: 0.75 = trigger when 75%% of actions remain)")
+    rt_group.add_argument("--lerp-frames", type=int, default=3, help="LerpSmoother blend duration in frames (default: 3)")
+
+    # Rerun
+    rr_group = parser.add_argument_group("rerun")
+    rr_group.add_argument("--rerun", choices=("off", "spawn", "connect", "save"), default="off")
+    rr_group.add_argument("--rerun-addr", default="127.0.0.1:9876")
+    rr_group.add_argument("--rerun-save-path", default="run.rrd")
+    rr_group.add_argument("--rerun-no-images", action="store_true", help="Scalars only")
+    rr_group.add_argument("--rerun-image-decimation", type=int, default=1, help="Only send 1/N frames to Rerun")
+    rr_group.add_argument("--rerun-jpeg-quality", type=int, default=None, help="JPEG quality for Rerun images (0-100, default: no re-encoding)")
+    rr_group.add_argument("--rerun-image-max-dim", type=int, default=None, help="Max width/height for Rerun images (default: no resizing)")
 
-def main():
-    parser = argparse.ArgumentParser(description="Run policy with PolicyRuntime")
-    parser.add_argument("--model", required=True, help="Exported model directory")
-    parser.add_argument("--device", default="GPU.0", help="OpenVINO device")
-    parser.add_argument("--port", default="/dev/ttyACM0", help="Robot serial port")
-    parser.add_argument("--calibration", required=True, help="Robot calibration file")
-    parser.add_argument("--overhead-camera", required=True, help="Overhead camera device path")
-    parser.add_argument("--arm-camera", required=True, help="Arm camera serial number")
-    parser.add_argument("--front-camera", required=True, help="Front camera device path")
-    parser.add_argument("--width", type=int, default=640)
-    parser.add_argument("--height", type=int, default=480)
-    parser.add_argument("--duration-s", type=float, default=60.0)
-    parser.add_argument("--fps", type=float, default=30.0)
     args = parser.parse_args()
 
+    # ── Load model ──
     import openvino_tokenizers  # noqa: F401 — registers OV tokenizer ops
 
-    print(f"Available devices:")
-    core = ov.Core()
-    devices = core.available_devices
-    for dev in devices:
-        print(f"  {dev}: {core.get_property(dev, 'FULL_DEVICE_NAME')}")
-    print(f"Selected device: {args.device}")
-
+    print(f"Loading model from {args.model} on {args.device} (this may take a minute)...", flush=True)
     model = InferenceModel.load(args.model, device=args.device)
-    robot = SO101(port=args.port, calibration=args.calibration, role="follower")
-    cameras = {
-        "overhead": SharedCamera("uvc", device=args.overhead_camera, width=args.width, height=args.height, fps=int(args.fps)),
-        "front": SharedCamera("uvc", device=args.front_camera, width=args.width, height=args.height, fps=int(args.fps)),
-        "arm": SharedCamera("realsense", serial_number=args.arm_camera, width=args.width, height=args.height, fps=int(args.fps)),
-    }
-
+    print("Model loaded.")
+
+    # ── Build robot & cameras ──
+    robot = build_robot(args)
+    if args.cameras:
+        cameras = parse_camera_specs(args.cameras, args.cam_width, args.cam_height, args.cam_fps, shared=args.shared_camera)
+    else:
+        cameras = select_cameras_interactive(args.cam_width, args.cam_height, args.cam_fps)
+
+    # ── Callbacks ──
+    callbacks: list = []
+    if args.rerun != "off":
+        callbacks.append(
+            RerunCallback(
+                cameras=cameras,
+                image_decimation=args.rerun_image_decimation,
+                log_images=not args.rerun_no_images,
+                image_jpeg_quality=args.rerun_jpeg_quality,
+                image_max_dim=args.rerun_image_max_dim,
+                mode=args.rerun,
+                connect_addr=args.rerun_addr,
+                save_path=args.rerun_save_path if args.rerun == "save" else None,
+            )
+        )
+
+    # ── Run ──
     runtime = PolicyRuntime(
         robot=robot,
         model=model,
-        execution=AsyncExecution(threshold=0.3, fps=int(args.fps)),
-        action_queue=ActionQueue(smoother=LerpSmoother(duration_frames=5)),
+        execution=AsyncExecution(request_threshold=args.request_threshold, fps=int(args.fps)),
+        action_queue=ActionQueue(smoother=LerpSmoother(duration_frames=args.lerp_frames)),
         cameras=cameras,
         fps=args.fps,
+        callbacks=callbacks,
+        task=args.task,
     )
 
-    try:
-        runtime.connect()
-    except Exception as e:
-        print(f"Failed to connect: {e}")
-        print("Available cameras:")
-        for driver, devices in discover_all().items():
-            for dev in devices:
-                print(f"  Driver: {driver}, Device: {dev.device_id}, Info: {dev.name}")
-        return
-
-    for name, cam in cameras.items():
-        print(f"Camera '{name}' connected: {cam.actual_width}x{cam.actual_height} @ {cam.actual_fps}fps")
-
-    print("Starting policy runtime...")
-    try:
+    with runtime:
+        for name, cam in cameras.items():
+            w = getattr(cam, "actual_width", None)
+            h = getattr(cam, "actual_height", None)
+            f = getattr(cam, "actual_fps", None)
+            print(f"  {name}: {w}x{h} @ {f}fps" if w and h else f"  {name}: connected")
+        print(f"Running at {args.fps} fps for {args.duration_s}s...")
         stats = runtime.run(duration_s=args.duration_s)
-        print(f"\nDone — {stats.steps} steps, {stats.inference_count} inferences, {stats.total_holds} holds")
-    finally:
-        runtime.disconnect()
-        print("Disconnected")
+
+    print(f"\nDone — {stats.steps} steps, {stats.inference_count} inferences, {stats.total_holds} holds")
 
 
 if __name__ == "__main__":